diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f8318e9c7b71f8dc804200043e11acca0abf02a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44df01808a4f0e90ee142c2872ca474e170a7d258304ae68e3e08e7bebc26222 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c864cdcbfe1e7b6303354465672f5e839dd42b25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72897fcb1883a79f45b18fff8f4bfe030be05d11edfb900ca888d5d24b271645 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c52c6450fa22091cf89660c920304423b5009602 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3b21cb92dad72516a7d5301f79257a43e20d164ffacc3e3263cbd962b9d627 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56f4570f218376e1d536bb9a90aa8f7bdccd2655 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d112fd6d8ef1ab41d0862a39a9338fcd436b06447de3a3cca921bba7be24923 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf9394df8ae64fab4849a6a4e6a31bd1a9181fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256b6c3f38c466c6fd569d423108cefa458e5339cd1f362bc93be6262632f916 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..713ede00fbe486c77596def81245c608d555ea88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad1a70f1370551a4ccc08f65b839ff92e38acaf72df22732968997898cd501c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4a43469ecfc3aa8dce52314d71824c7ba3d6463 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63ae6efa44e1afb28ed19d8f7c4f53e9380ab48b5c0543573be8d206020caa8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5004bf2c0fcaeeccc52fdb87d29f735f3fb1e4cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab97c3ee90f90b37596940f54dda1dda05c0b2ed31ecbbab09cd2604346091f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9baba5b9b95228ffd3ff518e5349fac899528a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792594cf0d2e2fdd958678a9d727129b727226f28039bc5394c1ea7a7b728f46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ecf37c97f54109114a196dac12852755d6af2cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224f942b934b7b462fd3b93990de880a6cacce457e755a6d95bc6739cb427ed8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..690708d9a998c413ddbc4ef82843e2f657df2965 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e7a813d98a9392bc73a3287b5c17fed5e7e7031fc955a4c40901ca7f97594b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7f95a0016f6c0ee85ba524accefc8f1f9a865da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef0775ba7de833af3635b733dc60a1e0816a299c41d9f0bf00320638326c597 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7c9a177bc78bc4021bf3f1ad97b2d406dda8328 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5451abe781a12851cbf97f4d0fbd15196c2eab5f4f00fd73957d140114bdd4cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6dcb340503c40a7eb48ae13ef795c26bd1a6ceb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca485d91ffbf04dffefcc76cac96a0bf0e8005ff31cb7ba6276e5a34b55765f0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc514bd2741cb80c175a7029ee11233c9390f701 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d9abcfe0260bbf0edc4622cfd2cb2465ac809de644918b63ee5210a6e8bc27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ee4e9341d6a21cee8f67f955ad3ecf6499f1e5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:371ca1746abbc37301d1ebe1ea7a48e25be63d23eccce1342c26d370bc2b1b9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ba85a129575393691a890ea197a22a50160e5d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53261c6c6f1ae92dd7ea7ae91eea12bdb672c6539e0a313ba8818bc1dcec39e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d153a6f71eb8bc63c5098dee3a556bb9ac0eab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d9eb5da1097ed2a22d18be8f43d68d11c6d47f139ecb0020eb394f9485fca5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f88c841ba1295b533008910cc01f04ce6ec4e793 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8590c463b48a9c22112dde6c71c5e2719f0ae31bafc4ceedcbf3b17aae8d3ea1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4844fbe9145ea763f818a1873cd5e7c68332f36 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719f64cf9a8dcaa9fafea020eb0d015242bbad9dc7bc4ecdc07b9171b26ab683 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1135bc54886fbe3a936c270938911e310a44394e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f3e62f8c021d48773ad1daac7c6c82a1aa8c305bc52a8b029be33aa6cd8571 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2027f7680b7413db3bcbd72cb228b6ecba6f6fb0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96bdcc319224a88ff1b6cf0afed19b8b164b879c8055c2af7797993d4e9e8bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d8ad29d5b435f9a45c4b565bbc7be1f7820f77b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d1119490b6f0fc50e5884afc4ecc68f6c34831bec7e4c331c15f0c41cfbceb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a676087780756defb526de4ac2f72b4de1b8cf47 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36775adfba313c5f641fafdf224eae5c4674d9786e99d197123d4bd429addbc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d44d254075b0e4648497831108f27acd8f8eff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b09dfbf36f98b21ecbd923fd66acb4e2af8eb98f789d1b6fd4a1956516650e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc6ce0f15c4298fbe0ab988a7abf9bdc888587c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4204d7c74e2606474eaab805a0d7b0ee0a5a69374aef881316e14d316c5be109 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..372b19286fb16cd77f8db7562028e0a3e20889dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0adccbc4b577bc3440f9b376df9fcfb773759dba7959b923a49dcf56dd49eaa0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df2a297a87e678f75f8abd406e85646d874af0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a043306b1955bd14fed7f574b3313c5f2e6a6d289a54944c00033cd5c7a5996b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1767672a2a4a4a47a20cb0c2d7380802d8afd314 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca80e59a09754f2b9f6e3e0610cecf57bab92c05d327c8dd0adcead5ca52a123 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe78784dab4154afac93af276fa0acb217433de4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54788de82efafaa17deef1dc877e9e2c2b2b379331c8f6fe6643d8c93a801cb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b833f49cdaacc944ebaba3df808b6b5844f7d5d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b127d491a1a9447c575da5a314b1996edb05be08049be4d13f4b890bfba3e2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2904ba66cf40a801d06f016294d38392f5e693a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d17c0aee8aa569082e477a01b0b891a05214f781eac971036a23bc144734877 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d9daca84ec03259691f3c47762cf2409334a6e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa63688cb3c4a6da0dfe0c7cd7407831523a4d9b32e1331dfe4647cb03b296e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fff6e2015414d93bb76dc3db6fa8a30aede4e0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d9fa1256080c8c546e120bc4d7d047cd8c93127fc3fd6f85c9a31332ab559d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02a5560fff5380bedd310fc50e89103c334c0bfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f1100a97440be356d91af461ea77eccd02f43ae52930fe3eef98d0d74c003b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e224777f3e8086355b877f3fe0de665ba9d34f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5124e51e5c9c28f329f542146923699380f801866881f24875c91776d5233c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b488bafd1ffcd9193a25ec82868973632bbc4319 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be89b080d2ba087bd2259e7d1410d36558ab824bfd3ad44dc3fe3806b11e743 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d955ecdc6a674300647e7312a80d84a4127f560 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3905841b561cd3f763fae468b90f91e86c79d9e4e31aacf40054d8d5b0330a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8ec871d0a90194454166cd1b2cd8d8730a9150 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9f5f4c26616af3d03c22c8f302b61ef0f0f5715996e6d81c74eb8045f1efae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36cf19f7a67562804ff8b7ac87e169d0d7e8c3db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b7492e014f7327cc5d667a2ea6256eb39ed117a457da550c70ba16c238d505 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a418a83d977bfb4a038523077f99d24d403c2343 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14fca4a17f817d29321932ae63cf7db3d769fd1acd4f4feac4dfab5efb84af18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ee7bf8290abe8fc20e07af8db454035e3ba881b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa0c096c66f8200f37a8d95fe8c12f5820c1a697e94c03f1d76ee91b2410f93 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a86b9aab120211967c4bdfb7e76bd02ece34bcff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0365e677039bc8de954eae116e87850cb77c0072682228ac8f3ca03d6ea8bbca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32addee95f27e29d4d84f27b98f46c56f40f9374 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb11772f648f4df4fdb5da1adb17ee46622dcbef9eefb1bd7e4ccf0014e4956 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd031df3158dead24123f522af353d827968111 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e35fd336a72d86187a74e113f8cebfddbc3b783ee3b7f182918408e74ed233e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e0d4d4204692f715293e90d4c8091cde802fdf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7b5455078ae6f885d779fcbae808799289b17cbd88dc311a0e7a6913719376 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa8b1eac262d8915dfaf5cdbbee95b66f4dae616 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ef51436559e70ea0992453032701c7ec94e45141e79894695b612cbe79d936 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3d65ac8e84c4232a69c29d719128244285055f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f706ce793380b6b6190b7846b7211aac5ec5eb66d5d88361f149c3d3267253d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8fc6c90db20e99eea5ca7ebeccffda4401f9e09 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7ffbee11e72b460c192b326c0a8f89feeaeaa538768c5f03b13f545f3ffe31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7ed7e84f0e1c3b75ea10f2576c63aa9742b7bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44dfe9ddf526cc2ac5cb882ebacdd9689dc8af49ea66c055b4f7f2a6383b739a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d52fa192d45291d369b22ea28b8b382808a286c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f66535e5f3cc9451aefc5e59148ca94037a4cccd2ec43a44fe487ffbdd174c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a5c2b69cc2e811faa39c9acb962859d831042e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992c19fb736d53e34c9cad3e984b4cf9d0f7cf89d9a9da4d91af04587d8f3351 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c64da7255aa1e82479761b5c17eeda7de58c968 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03e7e764416c2db5a6049358b3ee9242746a47a85101e2a902d2a165b16b39a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9afb2c8c92990b274192c5f675f13e70c49896fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f74dff5b41a207b3ecdb1830a378e9613c8e3da71e14130c8b16393e2c406a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cd9137c07d732c06dcf2c6c957ffcfc26a96710 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a461115293d6aacf0943f71aa749ccf69e0efe19f4ec2f312a37e8316a2f5ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..343e6bec8043caa6f803a11ae75428dab40877f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570da46af538345546c47aed29ccda1bbccf35fd645d4206e12a8625e5d12902 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34309ee223e82db0fe9ec9ca242e6daccc665324 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ac3095f91e167cfd6ccf8da04113c7e291a768c79211c6755199919c7c5495 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb5cb5e84fd44587f814b6e3baa7890d49351d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a617e8baebcd7b3cf9feb02b867d36f5f9561e2af0a81eae2f521484abfd75fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe8727d9d1bcfcef0fd8ca270fc7ebcdb2176db6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa34534f58d1132c0c25a241930f379b1adf6ad1089f8498dcbe7328991d831 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f67b646f5a9a549b91ad29afdc261f505e2144 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef4f9ed18f2ec4401bd61ee48891b1153210f31282fa0044287f89f430c42d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba8d03f9c4794eabf9e258b363a6d0892819b2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf23d4c08236cf0bde29456831287351b45cb180787b9b6908fd9d9a65317498 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffeb4912f7b395b32c0ad711b2f412059b73c188 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef25ed992c8c6e4341d538a65751eed1216f15f997cb492aed381e65c3c69be +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..148b68c96edc58c2a7bafe1adbeabfed52f417bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eafb4d8c2d5e2f0938d842a5bc9c28e5ae239af098d08e6cc58fc9b27e35552 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c2c88dd21c1db680a9da29d6a95d48aedcc039 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea51049bedbd25215d3c58ee008285f12b0b3ead35e246e4e0895da0116bf2c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..422b66aa71e7e3df5faf46762b52db0af0f877ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1c7f70d086b3c09883f45ac16bf3ef9770425904b18c580774db83d17129e7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fee22bfcdbc43a9720772485a31778eb0e25dbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3516ae8516f08754338498bcf3c11446bb707e0987dcf44237398cc9145a8536 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e16a5402cb8ffd0f0bde601757ffdf5429de94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aae396e3cdbac2fcca2bc02737baf86c7cbbd9d61bdba172b0c58413762ba6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a8aaed060f9d2571c06d48b904f7b7a4baf6172 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7821227b047633048b051d95cdc3f09ee6eeb31c70131cf9e021b063aefabf8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4cd04223960efaa1c670ca93acbb453f02e893e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108040b5504363bc7d4ac996526f4ce757b616984fa7a9e22ee1c0b036863b81 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..251635c7dac7bbf9a536aa90f72517aeaad28d20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c13c87afea14131102e2eff780a0604432480ec7b33e3267a4f70f29965afd8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eafb8a6322210275d1ee2e99dbc34fc60cd0b182 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9469cce4c2381581c0681e218976a1993b86ebd8c9a8ca717edae4bff18d9335 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca9cbeca366a1a6a689eae09d0c81663b7edb4af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59382c04e7480a0e7b6cd3086ed08f4d39035430dafddffb8dcb4d8ab4ae036 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07de351e338209fc892f06f6544759a2c9d2efe1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2079782036fc06b05d6c0d98eb4a9bd42ad2765a2b399d56bafd745633d41f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d81fd1ac9433c017b35c67238df490d11d96040 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb41098e8fbbf04b0802f38130f0f8831776f8824a1cfd06966371f8095800c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c19761a5ef6e412c8e4a7f357d17148e276ec89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ed2b98ec7c8f30f09cd18430b0f328c68e62e59b2b61ddfaf54799bf67afdd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bedf7fd9c39e514f335132e0c2fd442588cdc21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9cce791d3e1cba58e7ea5af195cf0858b0d6b9f223db87668952121455a1964 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7388de1ce5fb15f1f9af8c11a488ddebb2b1e13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2109157ed9b8ad121e21af4b2d079cde26854f4a55e8da784267d042833b21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d95ffee892e812578cd20277a49af405782047d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be6a637c364e266e1dac76b6a215c7d12fac7e46045211b0f609253ef04bc5bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4a26b1b571663ae18fc9bf4d5da39d6bbee8a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91badadacd4b3406cab09f6d5010e7f864c3dc48987f2bc0dc678e5c2afe1b2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..002080695e30409bfbcd1dc85cbb4a757ceae736 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cca3856628aa513ce32df2a230ff01144c6be4d130a006b0b29b181f92bcafb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41092a92d968b80558bd461ea4f68de27b4ce267 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0416788f7b74df8cc0a0715a2076d4ccd431b120d06d2c82bd471d38e5b81a1a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d3f6cf58c578229ba26e3201462b8d38c0bc2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a98426a2ca02b8719ead9532056d2b46ecd0e159ed366ffe652d017ba371d8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb289432eaa071380ddb00dd3bccb5fba3661d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c7b901b8d5f545f187e4d8dad2031c6ada34fc4c2cdc0c30a393d6c51a887b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..212835eff236b5e5b4e8fcd220362104319dd5fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a108032d9c26c11ae2e51459654e9f5b9d64e1d790a33d48992df3f3c64f2a1a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc27ce52c1454a0acfa563329914690c12c5e372 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e367007228bc84e3a53764763261213d3528ba73606df5b62ae6d15fe4644fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3258311a9bbc49a6575362a43ef45f188159ab4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953cab26467c52b0dab73d26a237d191f687ae2d65e617a150fb2070dc31ce1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1cbfe53b303f75c30444c4701aa5fc475f9da21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92af4231885d58ca062366c9238584cbdf895e11725bbf021487b5f2dc38c0c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff8a1668e577eb18d4e97ac06c4ad938b4fb5a46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8637e0e7217d5ba46fa5dd1e8cdfe33c3533a098c304fc2eccff0090da030ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d5f4c0f48c58daef53948835aa6175651281a59 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db18dd98e5e1574440e4f0c78ba837ae8462f6e9cac4ae246ff2cee5fb7c0ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6a0ea445dafe8744d8df9c2399aafa8c87c9dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db5678f971a1813269bb8fa11f5755ea2c1344b9f8b9f1941dc5a1516ac5528 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ade28f7d8e520c9c469dfb4ee2ee1226ad57172 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ab051c2f7534614aed87dc844d38f201dab374fa9c48fe80e5ddf99591609a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4403d18dfb153b32981f8c7a07621f7fd31af582 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32cd70286f9195cfa7ca5585bcc63d82a5ebe2156839a8898d5b75699eaf5b54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbb33c065d5d5737494a86c9e0a1e98d54129f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67306d07014db96c42dd284f81a9c2b7638976804cfe99886f6aeb1d47e61940 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d088e784d782224948cd525690c863f468c66b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafc94d2f21c46b55675d700af2e57acf52795ac18c95d902728ed39848ff5c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1035a901676e4119c75e59462af2a40779489883 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef24a858c328b5e64af6a6d3ae860f8adbd2f196929273b7ec6731abf7b6cf27 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a9c0ad5f5945d4f31234d980a996090b941451 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5037ee23826e645998b54bcef3c44d73f2f66c05704deb41bfa4a54207f7948c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cceb66da46f40f05b3cf8bfa7b77341c34fe449 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5110de225675fb0839e108046c10fc98f716af561dbee8fce00c5900bb312e90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebe6bfdec8597100e6a213d1351bd8005047fb46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ece5af39b7d04205ddd7497e2fd13dd8ef8b9099b8710769f865769cd94fa71 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..824f55203cf4a7d97cb4b26f0504967ba1b35753 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8a1c0079b59eb26656e4210b5f51eb0913c86fb692e4ce29d550c6971b93d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9406df02605cc4dee92c1939816c4deb0558ffa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19241049df51a667fcd2b35a104836305ac37c34f7fac40c198cc994fcbc867e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb29e07b57f9706ce3fc9fca29f1be141e01f52f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa8bdc2f682a3ff94bd58955e48e22c20fe620577d66e69832a6037a0404663 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7563a3b01372055fa1f86c6002ad005c61eb9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269d9f3b4f1182a6fde7b861a32a1acfc3d0c001e71d38e3b07dfb231e456bb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca6e0e33cc01d0c43742c6c0cc4da1322580b002 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d94eeaa8b4c8989eb38e07e96a8852b14d76d105300282aa6ce3273d57d68b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8632ab6dd7ae7048600405f383f31128288258fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ce7500fc9aee685f76eb31e02c96a491a1ddd63dd27a18cdb83a5c2700a913 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad2f916f17782668346a193571c93383b58d9e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93e59de967df7dfd40b23f622280d3a21a6cfce301dfcc4c4cf1a6f9e2f3385 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da6bfd7c6c4663d7ff86458b5a4f023d5b7f180 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95b4351aa3a73daa742a1812396f254c326102d6777dfddeef98074c5d466e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db60d01858794343c8c90a188f01945a05be224f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8dcde8b8c15e7357c0166fc47191bbfd4b2600410d12b904f060f6b95f753c2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b185ca214e20e190acf3286115686044cd8315 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5612ffd5d6d83e49257e4e812d27d8f64588629c6757c6f0770719c5fe6d4f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..595e44d30560bc2e2852f8a0ac60b7274182fb4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f277ee869e1c4f4f0004d634b6861ee1d03d8cb92d2fb90abde5465de54c7682 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0510d43380a01cbe31d2bbda79ce6269b55d2225 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09895c6bfab4f0f21f819dcc4404e066e5e4297c05f7c7a85dc19d7e3a75aee9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1cb56a35941acae5e1606c0015ca7c63ec54a80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910372531fcc644c6bc3f3af8b04810cc938c215f0c01c3aa4714c5e792581b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd741a5d47c5df87170062ab9252945f505ff2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de6cdd76d24934a7ace3cc45c4a7306fb61c0da6acb36cd16d3b6ae1e15604a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..957187fceb42c8516f5b68f29a51057c4a77e3b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d41aac517fcf510354192ec347f8c1ad442bde4db5b16e07f41c2f6f19f082 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4fc0bb1f4210a318a590e547c4d14fb218632c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:385fd23249c03201f093a0d356c2b80f4b844247beca1b3c2a114252d66154af +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce5385d174d4165d49b9d64b5c0b52cb15fba34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8cf04ed2f1ff18d29964e59ca4277df25351ee1ed6afea2a897dbbb3fddd02a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c599cfbb291a2228fad11c7117169e4a19346cb0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee60059b77f5b46f28f26e0c045b865ba84c0b6963826a366c38c068a7382463 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b728ea025bec372b920500e5441a545ef7a8e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77631e593349372e45ff70ba11e65f3f8c775589b065385b7179f0fa59305979 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cedd8f7046f57b1e808ee5927167d55f7ed174 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fe37b3f816730e9ae5200bca1d81bc02f5804c6579da8cdbad18e471e25567 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b39e4cc688eb3c0ac8eb4e9d976cdbb6c5155277 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b6e55b3c0756bc1ed4db88418d406a9a242b25615a5ceaa825a27d1f743631 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53cfe88e0cd8e25d63cd66dcdabf3f8538876740 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcb5efd4e819cd70b572b8646d2762c5ff3bff97be901a0a6d81f9b026b69fc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50de4b7d174eee6ac01cd833f59437a596cb22ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c4413d4c584fc1c47e2f98f3b7734ab227b4bec4188a4325eeeac702d3da38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c036c802a06cb90e05f19c879dbf763a73401c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd05c51a9bfa21a655dfb46a746de0d5f9f2ecc14b56fbba69c48825e48ffde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f41997ea46af98dcb23508781d1a99b27c407bfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac8573f6c9bfed318faf8be29a911133c99bb240e400b207da118cf4fda05df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28c92c323a336a3689a3fb9153117298113b10d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9495b5c047611852fb74c2804368287ad50813bb21390cd79b7de70bed38f501 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..582a4cc2b664eae90382eafeaf9aacb9b020a823 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de8d33f03f29ecba1598a993a0de51c022769aea08513ff5236a83831ae22e59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de2a99e1657ee0670499582362ea336832dcfe5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8097022bb9467934c8e2b41bf00b280a3cda590b8296415c760d0beb40ba9ea7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c5cda53fa720eebd3e6bc086dd5bbe1e8530e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95af60a977820ecd7e1579d1cf80abc9969a78e7ce80af6625002a1b15aabe6b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f177e0eb4a1b907dae634503f7e1f50a2ff59060 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c1e06d0f0ce381d48efce85009c566be25c9567d334e82782bd0bb3af3d830 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3f222d910376d7ee9d97837eca22e64d95fdecf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed932fad2cfda87e576efd207fcb09bc8032226ad9dc7f7e0d377861a80b0e77 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6a11e59ac4e9ca1211d0926ce7d6dfb905e0752 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b575bf23c36e98322a2456978d82abfb78fefeb969c4047412e5a504dd51df3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3154612b141b90e794a827467b8edfe2f207b48d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3c00b9b35a065ef2c44a0a4e829fe4008b609d50b5c72b93a76da0b013e030 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb99f93bda5d85954ccb062e96520cf728971f62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3676cafb83b866861871eb9a97b865694c6817e998043ccfb9359ae2de55e129 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a9c05dcf4170766a7c5b5dc94abf315dc5657a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4b25f56318559ff712f3454e31eb3a6858c756ed9e3017fb439243640fdcf9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ee6b262f91d6c64db7938b081777ce085a8c785 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940d4582fd5f01e76e959db4bfe3fc0dc79912b6433457aef383696a438a717b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f3b89b3f71e864435c0294c0e6c2044ec1fd6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d3e295ea929545da5daf968a9be81cf970e9a4f4909849de4c18a5f1fb691b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1c292f4f8b60425489689b24900a1922a5f339 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840d90e716ac72c4611e8cc598a1cdbbd61840c9af297d8fb0e22a966c519a99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5283e3f4717b9bf62060a4052678bd679510f343 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068dc4b8964101c77c1aa706b60665fd314fbc8beecc33132a6ad865892428ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd81a9a03627e260425f2b25648ef0da2dfeaad5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4e4fb33546d57f78ed97645d2c3c69f3faa24a1c49a9249a89573a53758603 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee65fa46165ce5edfed80c873d55047c8feea99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec77ddf201b10771466c835f2d611520b09321c014880db0a0f2e895c90c6631 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e64190ae8b53272870bad79d2d720404849b83ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfa2d89db83d2b558c7537f6014a42d5397d0fd5758bc3bf3326ef5f7f6414e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c7a51752bf07ab9e667ea761baf3f286ce3d103 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffbed5c2a792c5e91e3e17fe8797f3d499bfa93ac1792eb71a532902bac2f391 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..140b94589452104aba8746ffeee45b509f59295c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad7d06aa1449aa741e0d562a10f7a47f112689f1ba2e126c321af6366ee7e00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19740e164a160680bf45f517e7a803ef87b2d5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7c502aaf929d7668fa1c617a23908b4e90ee1540f2c53c1e706bed1e2914cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b2243eaddfbad08eec8dd76544aa75bcb860a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9b6991ce1d246bcff81d2611148fde37b7e033a42edfba29ec003e9348d7f53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5ceee4069a64eb8824b6928ddd024740079c6c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f1461237751b74a4ca88a2523b01a5d94de124a110158c868f681f596c3a55 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..863737a42b1dc35d0d382f7e7a9cb480545780c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24d1bd3def1b20b8957cc0903e0479ac82b63638a34935b3d08b0bb73ca30c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba36ddeec3a0ef000413efbd8a1152c493a42e61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1f371cbaac96194026d41eb0432c6a78868962ccda314f925e31ba5947f221 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae003ea970c73ec1a9a94b45aab70576c494cf06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de1a975b391218ba4e96990811723e98a661b834f0b15f6de9130c71fea447d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e2c0c4c7f91c44fc1915c35e8a577ef973439e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f26b107ed1af4b72a2d0df2b43bc005478537874d83d09b3205cc9c5a9d6dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..518e0e1493e160974e59cc8393f70ccdb5f5451d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece66b1f59806652003c205124c61c54c92a85eed9e8ea14efb4e6ada14ca604 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f1af8269893f50de5f89d3fb199e7b441107ea9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eef6862d95a262d2f666ffc0abb34c5a178df2865346d8bb130e2b4549a47a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b353ed1f052f50736d126984a8b876e86f99d8dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f6edd92cc3d99f2cdcb82c95293b2c4602fa0d02184b91104dad4bae87c9d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90bd99b9685fc6c65ae0409672422a72c6e79a68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389dd92f83342dc40807992e0e0804beef0a020c2952f374a9526e107c0ab0a7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9044bae455166ba24b2a77df921a001d3cc7cc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24fc667194ea4c958d987e3174e4c864e0f561c1356c169425cf13c17313bfdf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3405100e865824032f2a453662c45c478afa4ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e9a1bad33fc3dad7eff2350e03530fd20cdab95c306dcfa02fd5877f5d4720 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8735844945dad5cc19b2751ae44e7ab4b2424482 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884fe4e50c757fbaea04cafac6d87e810028a6c94bf00b68b6b5e38f397f64fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc35d6e9651917d980c8b6ad9f94b5340f605a72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64014b0040ea3a23d0d7378064830fb034e9cc56a9f4cb4d3d0c1d96f72b4833 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6c8fd9c150af7761c23d7a09d49f6af529279f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b131eee8485c1ff965e171ebbff69f7e3198a34d1fa44798d73cee66ad5f3d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..698b10733f7686f4c1b8dc2220abd0f91dc18e6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee6ea7a8d440ded40d36515d3247b673bd9e77a861e31a0988ec7592c877848 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df090f170548db051d6dd24fd05964550fd80091 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214b1a9b7eb19af61513adde0e57e9ea31050f3d53acf63d4a1f8834d42d9482 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..481916fa9401bb7f52437ad0c402bb8854c9fe5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d977ffb17325ee5664522d2e392203226278f12a5dd83d1acd4ad63a97ad838 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a990f66a22c268c1b75e4e8538dbde2f197ff481 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9b099cb4563f81c5c7babfe0f6e8e2abf4939d06d937960802688ee4966bb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09a9967bcbdb1dc6fab5d8a38dccac136dd4dbf5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34add8903889163d3db3718e219a07398f38623306b2b94a1b7716c671b9631a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f6bf42d70626f6708898b86aecf71947f4a16d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4577a751ffc1b2795b0942ce95c3fddbb4412d5899775920c248be450f070e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8c5878023f12df7b927fc2bf2aaa0c7f426176 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762dc8aece3df5f4202de2e17515ba6b2f3ff62fa55ee8bf478004e99749e77b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07787150d9b36eeb9c9403babdb967807dfeb57c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eca50bcd16d7c10edf6b8257496a7f98ef3a9b00a7d97665ac9ea90a93b44501 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2975c9d640f9af427833675522d412b612c90e8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df3ffcad9b03e8ff69b1a1f676729c3207eef453ff16f5e70b7d9893c6272e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97876aa4475c0cbf32fc0259ffa8a74c83b72a3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1427cd1c37662dbd62f32de8b597e077d6579e0467eea2f290f56900cdc97f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da9839d743313f5f5d0ddd27e73b6186b4ee900 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c19d93aa8ca11b855c44b28c96aa3d0c5a7d7ba7c7240f6ef53ccbf22818784 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f1862912abf2bb6b197354e6bed1a3bc3fb763f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae7b18e53cc68b85138f0a10b4a429c9edca34c7e5d878094f9b29478bc632c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b63fdbb90da38add2ee500b7cda310f6c55efcbd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93eafd5bba43860e0f6f104bb6d6a20d80d503c089ac6698f2c1b9c7d0862927 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0594b24497a36de94e858bc156639aac7521402b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cf47412231dadfd029b03969658193f7e665ad79afdeec16230516b47fa6c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31c151c7c89939b00b03383f7e39a9cb7bafabf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37425abf539191d88b33d609820869fec469612756ef237545475b426e46fdb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2adc64a735e2672763ae1f64288e602cd67d6909 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfc39c8328c7ab56969a7a5961184bf6e15b46a09f5deaec21bddff0199237e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8bc3bd87fc4a09e69d0d9c7fc39baa425554bec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27dc2394425c0e45fbf99ed074c60c995c7c7d85aa545a266739283c2030181d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c3a78944e415aeebbf232099d5d706e773e449 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a6823d0b1a8d7c30486439c4410210c01f192c6a54da21531850bf6550f24d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f5053f9ad5d2093aeed2198e253b6f5f767ad4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d108b4f544a46b7a426e87772a1cdc5abf63647e1ae32b4d3129ac4900595a48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d55fc7edd5f0867a96f2e5b6f5a992c44b14e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098d704359e5cfdb6e29ad99b766c8c1d38c4077692fb19467a626bc18df6eb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03acb041e5470d30190da80758fc3b7fd3f1c475 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c16712d95676b9b543ca455b52156639299d2f7e027c31856dc66a8e0cb29d33 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d6bbc565a201f24c163605a46310b5784b9a5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4612ca15f515bb14030f6d379f896385ac6bd9f60cbf33bd26944a3101476a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29747f5dc46cf0cff25b2bbdb7f9aab3c95fd754 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a907c2506e6dae1a31710aa62d522039c48345369b9c207c0965a09bb6fc822b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..515722c2f06b17a2e4bae8c9f4d70b5b371ada9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:656d0ac1d3a1be8e39835f105e857aab3878013ef289fb175481ec678b92204c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48a3ce020dd15fe2c680183be2c7e8a77171ce46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d670344d20934ca5acdbeae40cabf8d72bb32f8efffe0fda78bd1f592456b5c6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2e19ddc2c88792420b8669832d4ae35ab2e0fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce656af8900149b8ffe2a54c45b6271b34cf5f4d37e441def9dd1c3959c299e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e49fae40775cb31e82ba2f5e5bf42d4508a9ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ca17df64f9e03d709429ea9365b7725b49a1d8865139f42978d6b899ede8ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4217e9d1c7128f60ca1d48e77220f6c85d3093 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a3ad2c7c431b85d4bbdb963c672671ed80ed0b0d79083798271a223b7ef2cbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd6dbf30921893cafdbaa7df33dce3320e22f18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154ccc79a7dae181b567579297bb5fcc6d0af5733cffacc50b1570c8f1570b9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74a5a949c5eabc4092d90ea9698744ee9fd87280 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a92e49ed6b898e05ec6b6dccf5345a4e1b977429bd7882d4d5dc7455dab6a8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd70df286a1ff3974a4c172058ae7d737eca6f6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d471eaa4ddfc94e3953735b22b9688e896187c9e95bcf21f523a1cf9ea66090a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6899c98151b1aced73b5c74fbf6b6f1116d9b03b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfe8d5f732ce35a1c75ab4a3e9e1816e29a63d39ec5430e5f49caca8ca87415 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27b36d452047303503f9d5d009513c6b5cf76a0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00dac2ba911621881468474b61de2bf6b164016ba83a23615fec84a37209780 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ede3c01e4397dbe731c5e93720cbdf2175c577b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db96de06ece264cd08be785851dea72b15688a8e0944a0e48be535293bd05e36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b4daadb55a2af629ac0a7bb24e94b54a428cfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b630911e2357d1ac9aac08f42a8f079a5b75846aa1eb8821c603c09b51d3212 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..310c4378296b8c4c38152b7aa842e2a0f9543b2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f53cc6b9ad727e106c2c87ea4f928484b118e417d1a5f800803511ad8327ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7111db570a6c251357b4eadd81b8e3cf3c08aa5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b24395301eaea924829c7a530c233fb54e8b843eee673659ac50955ca96f1b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20144da99fb8318b4dd96b60676d2ff11b677d7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced4b81631c6b65c42523c67b003fa4e2ca3d6407f6c8a78f0bd8d6c926b147e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..291f66da8f22391f48f196be060e7133deb65b00 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e65808c46def42f0cc51adcc7f1283667f20fa463a21cdf1fa24081d79805b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..037815afb14044f40892800756ff4f77528c6fd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:742ee56e3dfa604bb0c48700f6a840d8fd3a027402fb48149e1a8c0bdbffd57f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c78627de3ef2d98a625e9582ae786468f128390 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3791ad15e494c4d2d05bdcd1d1c772f43cf89549b226e2b3d8fd1a5a522334d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..638d306a96b0e3edc6c15ecf825ea254e593e487 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e027ffe56db6a74698f8ec46c54d727dcab0cbf1df28d98024a0bfc5d6b2352 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d816c609ae1824fdfd001a1d49e17d2a7c766e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78433b9975f0ae064b40660827932678a53ddcf6a0c0f6118d9713a7627a968d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a81f0c3a72356f241803e580cb74f4d2b3b465 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee06e2be30e7f6419d18de08cd875dd3b01dc49841c40197df07fa71fc980a51 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7006b0bdc296e01563a8ee534c491c17881c51b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5a318f73c96cae59275d2ad26f090cda4a37cb45125af193d5dfe6575a66e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..863ae90cfc9561a3f51a385fd1b4b5162667704f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb740477ffac12649f6a0334b70db32eac11d7592da59f714034e700d25e473 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..918e10209b97bd12f21d9b15e249057e0206221f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c79e834c19d35f32df43c3b2e8c011d02008517447f356130cce95fa6096f21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc3b856d6b8db4d588aa705bd6156c1fe93e4d3f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0e0bb66144fde6eba1029f4a37c33d87181662a4f9f031483428a28f8bd2dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..031d302694c7c201e0e21ef9b356df68d1556c69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c35f0d3ae8676a5cdecdae9fbfb737a85e1290acfbdaf3c242e4362096414d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de41f5eeec969e73d38045033ae55d9bbceb1b02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227226c70447fabfda882b5a0ab55fdef65a99aede7e74adaddcf8b3b0973717 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f67626a7e1fa86c7df00ac0df9a563eda6e2c361 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c11fdcfd914a0e3dbfd7acc3d9462858ef22693bafcdb89bd203a3578f2a62b9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93a84b7369875ac2c6bd09f7591a930091bcf95a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d88787a25d000db189fe8edf23a6d3ffdb65b215c3a5c5bd613c5750e63c22b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c94ab959c623afcafffcb837dbfe5ebe38c5395 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cde3cc7243a8ea49f6c9cc2450dfa9c07de5e780c4a76ae023994e62c6b74b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..561c5bd48e2bf0700f12a74c12e62652563b6e63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e274bd9bef04bfdc2d88cf55f12802f59953f1f144cf6d104caf0216e0d2bb7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd82ce86f6489a2106aad2345ef2ec06308e0ca2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4196635473c1187fda8631e18fb61f9aaf27e1116d62b6cd6401b5eb3808be1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7609f5dc839cef86818b91304542a6e1f53ea926 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a65c008a7c599c30fc612ec510319e04b45f75838d46d2f80838306c2f9e2f22 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5950cea3bd8f7309a4c97e95fc4537c142df5366 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebbba966b3a71f7a9a0ac7a463476bd18d5e0e7ead36670a2a4977b6fa04092 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b3b579cc8ef4ffeb00bd658b2ee7db1cc7823e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8155a4ee741944af1b255b799316f05f9c716b64d02bce5569fad3d8934850c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..775c2800f6596f1d86417de874aa6b4bb3184bfc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b9c8a988a7de573bf6b6ddfac4d6721d6952ecd81ca22f6f9b1bc2fec98d8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaaafed23b06c428f5832ac2d804101952f363fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3e1b7631ffdea2c814d87b818c647e2f6f1a4db5a409b5b6790258bf178d0c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3a191c7916ecf351c282d3de880fb4c0bc477b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee318f79fd2ae80422cef7d2a2da32715a00ef37b20695b71e37ea9251e50939 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ed8b1a0d2c359f3cb320a96ce867fd0eb73910 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2188f7251b0926ed967adf8c8b07a892cf7b27a7d0e563b604266c17c9af234 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..491a7b134537a317a7fb47cf831e629d8097bbcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4aa923d16db1a85201a484805edd0f76eaf47e1cc270fa79d2606c0d7a949b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e29969f4214b660e830f0f3aac50d6ce45dd85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7569215a30d2044dc36cbb36fccd1c23aded6e9a7b9e6fdd93e997062ea84bf2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba09b83df3da53adcaf7e07cd3198166a816971 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf1b6f550821a71c502977a807ed770b5d8a00a47a5277af3be3e8d000aeb9c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6395e7a1733e38da47a4349abfda9e40d96582cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95613f6103832d4dce3d3d50ff26901c1e19b7f9bd9d03a0edf48927a77e16db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85f6751fb98ae8003faa1f7616e2d56a9a9bfc1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90923d0b540b7a787ce34f33dd2e659d78aa54cd3d722050c6b3619a4d9256d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5467ba3e37498033854634527be3adfe0332c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec182ce72b639a6536c8101cc7cd0f0faa4690fcc700a38d0a0e9dc7ffa2f67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3509d4e729b9d56d3d6371e332531621e0198ee1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ee42d76a0f04ae2a87dd1f66754a12b6c0ecc2d3eede42f675db1bcabd749f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3b4cc2de252f6ba406929dcdbcd255e958ee32 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd3a28e1934fab3848877de7382b03f450315fa781bfb670f3a733483f97deb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6620a421737e536ddefa1050e31c0783d67197e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120b0ee8aa93a63041a69839ea44868d3ab6e521ad2d76b043dc2c1e8720e1b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4237747dd60fd8e5dd6010f648aa72ca9872008 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937463ed3249f90f433a35a3d1239fe160f63273ad42fc1adeb29f430de0e74d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..529bd879e3f8b88c22a70362750e33392a0c6d65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7038841602f6f38a6ed1e88b733a7b7a7f50f942277347068b26c6a650a7a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd0f82abf8f56c1518b36b09319205207e178151 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9d188a8da65b34d090e3bf36973ed56f1f087f155226032ba56bbb18904951 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3a0ab3fb378474530915064cfc6154b7490406b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c667c42b490f6b415cf1f281951ab3faddb8fac013f27ab8dfa5e3eeabd7447 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..596cdab2cf67310c446546c0b87c1c39addec80b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c7214852d68d8f9f94f7b1a6a0f94cba75ac229c24dc2da3ef082ffbdaa606 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09e17f314b2efc003e63dbb7734f1a99ce7d8ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0689769980a8cd3ce2978d02d730974241a87837e7f4ef634666d6953e51c66d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..383ec94219723e4269ed11e2469c9993cb11626a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7d99f922b2952ee740596ccdc87f54f0c9fab85a6f44840131e7c68893544ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2fcc26144fa2f3c261506f01a61a4b95d151cec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f76e90e612b6ccce6c6bdf567bee7f127d139c885c42d0ffa098e9695af8ce0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db2f77810d566b8618194c6169d2704bc21cf8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f27c08b5dae64cc15f4c4283825967d8d290e3d7d61ebae27ea44d27d1dc317 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89a2b211444f565f49acbcbeca9c8f230f8e90ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607d8188ed38414a3ccb5193087979c972393f732152e09d1b77cdc7a770e6da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f41d8c00f4d34cca01b0d7cfcbf89c9b0c8a4ee7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de42c7a36daa9c64a68930932267b821ac19a778b89e0444e04b715ad7671215 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea012cabeded34c940f5ec40cbbe14a8d858b1e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f42476b42cfaa14a21b565db4f22ec8e935ccc42d3c099a9446fa377565806f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa115c5aad56e19c9ee0df8809a8d6f63c8a04df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c635e0b54aae377c7d453c55f4a6c2fd874beab54bface672bbcba24b2c2ed70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f3a641cbc191c2c3401b4ebcd390c61034b3fb2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9757d08d51aceab155ec8bb30f6e588c7cded254c57e442140c6012398f04ab0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f2ed49478df7f77a95932000c971b3581458a48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3033f7d5f75ea4cb45c94258f40a6f6565a40f3765fb96f687dfa3d411ec3aea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d27f8b6958a48d29b9ebd1fbee03c48f5e424d7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61652cbfc535015a720f84fc0e879efec74371913f2c597dd983df1318530717 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7cba41445b181ec0ec3fba0b019b10af5896ee0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d3246d30646c453e382fbee6629e73b993d7bb2fb9f378358fdc49947905c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a371984d617de5f8fe5b5875ed26a3e99195608 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9485439f2d51e39b0607e786a67bbf2bc9ce240e0f08549975764310a00685b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c373906228de5b69798635167212e023b3d3df77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a2a2bd952cfda92da7e683668c880676949278c699a2a566637e030d480878 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2eff468f0f4d887ffc63007a4c09e2f78c6dea9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b23fd1cbc8ff793910dc24fce95f90a5959073c6144b4b239ea6a5c5edc157 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf553f04333c50b2e89d49eeb4c48c8c4a23c8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de29ab2344711f43f24db0bfea8571d6729f0f4ad9246bee3928e4636e5e4e68 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..558b7c0d2279ebef7c6ef1070598adca43a11844 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2fa8f90d0c38cb26e028d2dda2deccd94ac36f7fdaa86f6b7208c019b47266 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6479a87f27f8c750cb2e727fb5a483ba4933e0cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46543faacd3f2195ec2cd2c5c1568ff74769ae3d63bb6e38a51a312f6b9e04e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ffc1c212215932bebaad5ba6efd17a03bc10f43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca51e54a968e34168b3b42f29b77137297317792a62cdf348f997db2216078dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc1c769c2b99ef0fa4df72bb616dafd0b1bac66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74c54a620f29cdb0c9e196c0b05a1b1569a0ec5339970ac02742408143b47a58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a106ea4ae27fe90c14db404053f21b03563c5022 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c2c4eb122404a6098117025338ac1fe9b344919bf8b1e64c8b2cb420a612a9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de74b319b11cd72c350879e900a79c40d2d11a4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22afedcaf8e7ee6c3d8a5c626581020ffbfb5821b874a0ea90dc462b2764d7d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e6a11708cac82850fb10814388938edd25a2647 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fcc5be69384be633bac2800ac0d615d3ec377f26fd4a00775bdd40dcb38d58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75cb05df9cf96dfd9097b645a3401295ae64489d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c843aec32587aa776c45567ced9feff28e9e3cc473d8fa62d1b0bd3d3f251f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6629f439eb9a9b88c479f6be6029000d4cb6b66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9848f839f87743160311115b3a36ffbe70a68b97f709cc0286ddb2c3ab7ef67 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..344d3e21b61c39f841d90b177fde42437128bd07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cecdc80434de94c30a09e345ccfa3abb5d59a2677d7f1754cdfb9ac636968efa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c3d36c24e4b1826915b74a2a6a4d64edf2df64e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a339556709f6f5277d6796ce7f52d523ac61b4a7dded93e2d423cd7171cb06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71d41847ef4c7e4e88e9064bb9040f7949535d75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb251dd467df8219b4246adb43be2623683257540176d4506e9ea9df55f4894f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6e007714f9543245eb3aec73552d06b5c61ed1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e8cfd58f6f146bbd60feb468b7d35782692d2a4e62ec91c1e523bdfc0b170f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41ede181bf5e9ce221249089b497da374965d9b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910b5d87d70d8d5eb67fabcd898fc9d81cccfaa6b8975066db6967290aa9ed9a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c744c1fa4316e0d7c83abac1fc497da56badbcd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591f36d0d49fc6c21c52630c16009caef397e5a35b6472605f8b9425e9e66446 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6f084b3f63f2daada305b89e5ac10185be6983 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba60408a4ce1100988ed9bab926df814a22882bb8a87d65de66f9a29e5c979ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f41da099be1c6ef90761ef70a0a9abc0b210daa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2f0cb01614b5e70fcf6e85374831ce4b332c9a5acd9ad518241d347ed24872 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e11e2813d1570d6faf338cbb5f4d59b93ee7fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0eaffaa6f56527087f415765b7d4ee0533ee577de7aebca3aae00bc83516979 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b709d8193e6008f46c1aa8d92a9e6354c2084bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59bb4142fd72c8bfaa9a90cb3c1aea05a1c73c8c50e21c78a4cf2b9baccf0d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d35cb3d0ced2504b8e3c60af9a2d63a065b5d5f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122b94cd50423a58c77114539fc53e19396f8227a5deec887227f198dd45acb5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97284c19fd3e44cca4b41fb8b9da4612941f24ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f11c5f441ae468de7e367f614cc11903d7903e3c1e97cbaa75df4d69db5cdcc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f37865b3cb7ff50b1cd6a7c170cadc64f1732a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6916c25d53579eeab7c08fc851c313070c04c279c92afb4a32054ee75db56ffc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c48e9c61445a89b5cca6dbc79b77fa758e06bbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5391523bb6a622ac1925f693d06de7d1137cc5f41df6aa6c84942ea8a999e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8248ea9b3eb116a0e92511f21451f47b50a7037d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcfa6d824efd62146cf97c7e7c5769968e77a897b53d719a0a38d2603a8f10a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9f00e1053fe61eb8971d866dbd621b3beb0373 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773078db82d0b3422b2e409fbe9801578fe81a27d23af43f9f619fb42c3ea573 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb6c99d30e96c0e5c5b3367aa8296b9fe5a2d0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0117e9bd73efaae0f3043a861dc309ee8539b609cf84470ba6d12b62aa090945 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4416292832484616a34125fa7d4ae237d41f329 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491a8e106e6b62b380f242802adcb79798a6658e70338e91ea0ad8d9aa564d91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af5fd82a8b7709e13cb1f5a4b9ac5f7f84df891 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5499c486d3fd5c613eede45a7376755b7a450c14e0acd221883aae649e7052e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa79c51fdfd82fc50b14f4d1b163a358e6f0bf7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053ebd8f0963876890b0a4b724eac00a7192864b34ebf2413738217666afcb0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..768907a99d10655dc05051160fff55651483eea9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa477c0d0bff93c80aa3b652244eb0b414b79085db5f4776e9ae63b5e233c986 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65af898aa89125df1adc637d5a8ee021e694ce70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a60001dce09554b2ac32aaa93332a0a336cf9fae3f86ce5adfa296c1ec48f0b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ebea5547960bf1123c689c6d4dcc5cddfc08f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4ef4d74b0739b1ef72252953c3bab85712d0d43987e660fa0f89e001057cdb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ecde4169ce3c8e30ad1187c4b7200362d9a1e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167624764be4d4871b072a2e44ffd514922f130aa065b95e9fb1692de0511ff4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..369a07bb8e538bc36de137cf9d57d9357252fe1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf8f80f53af079cd6b95b61b6590e827ea3429c1e8eb905b75b5ca204b9b33b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c335297b6bd49a9701ec6cefffac66a7bbd008b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ddfb57556fa090388b0d3c361edfc103436b662f2a5795a87d43b4da69035e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88f53d225cbffb218e2ab4615ccab2ed3cb74579 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd3f8aa4b0dac13563ffcf8a67c515908252f724ad15def9c49bff538168692 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5555300ab5312bd9fd0e40cd383bef0ae8d31f1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8c94cd01bbce66a185c06f4c330ca39e5dd4ea9fdc9cd3653bd9ac4588de60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acf9e6fc685726dfcd43c527e44a344f012ad253 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96d8a39265d4fe718778aa6569bbc98c6c08dacbb73fa70df60ceb7e8b49741e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..378e6e5bf2a5d263d146d7a8a46a94bf52f07dc6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70fd7be53161a4c6989a53e571108397f2aa33582900a4109fa3386d5a54dae7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b07862b5fd03d94504e7c21ea9a5b1a8b19908 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e103ea7a8ee1115038540c18b7a0dc534dc6d89add52afaf616aaefc532398e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..734309af30b4e75aed007af7a09810517561658d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c14c8047b9ed5778347d835d22a926c6334c5346752cd89581fdc88c7b0ad7fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a333e6abb28c42101ec905d2a105f825142eee97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca278bb56341379b868f9be101d33723755bc86b424bc1db551d9af6f5abf684 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3590bd8026bf97845dddcf7823f1a2788d4f1746 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb3a7b636a418b5b4085f3ed14004c59de4160f7a617152ba2b97059c8a08e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28cea248decc545c60f6e9aacdf40ddab5e5f36f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b015da6a1dfedf9e0dac85bc7b382505188bf7b312a131cd5825d70e8eef79ae +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccfb10fc48bc90e4457fce18c643501e518ae86d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26de0abde4c15c95fb4aab47d2eff42dc007566e6eb02f5cf9ad00072ebc2cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..707350e31b87f8063f8274f76f3951272e066ca3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50cb7842e1e842829e02468dd4975c17f5d3aa2ddd56796afc4d7f5b60b3e3ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ac34b6faf7167e977760c33ca99d138d3c7ea9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b6c40de7c765e053a5dc21ad7e317c250b203c340b82aee543f75014f2b4832 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..652f7903d38234226156929348ab756bb8394e3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc68d841dc488b4de23db22a61abf4630312bc4fcd7edb05efdcf4d6a59689c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea316de19032a83c1d5bedc84f9df51711738a7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ce638983c4f2a86eaa31612b6c527dbde648cc5febce52f0327e34e36aa000 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1171ce93501ba932378528a348ceaf71d69b039 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12379826083ff59fb7f8e723aea8194fbceb14583902516e4f0339292896204e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8567314b8332b6cb953fca812167f5bed09555e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113c4c85704848bdc75cb1edf2cbd0105f91d5c944c2275de09c138348bd1f8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b51ec5f18065b7ce520372f31923a63322d0ccb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91aa3ed82d4fb1d885a09109c85dcbc2ad1e3711d1ce6efea309f6da3154bdc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba50edbc6ecdf0a40034994985051c3504a7a9b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbeb5e970b3d8f074066e55262404f40a7c0ae579be9a8c271ee27d9d02f124d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96520120b59c45880eb1a50b6a3aa7daceb1bc8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba918bb216e97a6dd0f7d2d78342120d66069f8ea63bb99c30c21465ecde4978 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6dc46d3f4c238ebfb34867e08f55576d556d07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341697138698fd602a625775eae05b5f6aa86c95b857e7db9e1e91660d382452 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8364a506805f5c03e1691555273c53a2791486ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:247e332a70370ff36b7dd46817f4412c35168d67ade6e987d1936b94dd3354de +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..073390cb7ff2bee9284a29eb79a0ee1ab6f394a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514c7c0575f32763a1af35ed1e20caee138c19113ad23f0b22f2bbfe7fbf8c44 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f061bc97831719e5fecba42380efd55c1eb4f3cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0777f194a96e79b2abf19d2ca83040513d39bc6e7bd8dc37b1a7456dea2bd1a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b268e368afaa898ec765bdee3fbee622d72624 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8107da1e4499231a33c7093aad50bb2b416add44805221396b7db8a65e674462 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e64bc4bece77bb60bee9d3e1def8c4f64bc48e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ade2fab0209eea320f5641463df1bd8fdd5a0fe01d218db149c400387409fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a7946b0b762f79dcfb7e308cc6aabb740f8452 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ce8b0c873e437b6ea6852262428757fcf4a9a53fbf634dd19376f70481fca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a470bee259c25224bdd175563b3c28bafdaf6c16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf224a42d436d591bf6a65c68a16b7bbc38a28d92d2b7e1a402392ae29e4d6e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b472ec13d056dcdcb7b53bfdfbd3eb32f40abd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70bfc495f8956038dc5bc3bcbb024dddf8f0c89b126be1d63e6c3b7333e1459a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96b721fd72a983360c084209ef52e1da1317e437 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b3cebf86476c6baccfee3c3bb7b4db60b1dc0fec5fd2eeaa485dc5eeb7f6a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c181d52671985b4133488092f9cd9caba52cb6d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844539be21336522c7c5f941c3c75246d3a204513a89b8fff18b25db1ba3da72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47fcd91a2b0f598b28e414caf9aa9eb72ea93dca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9ab37c28b728a2749b08524acef146cd5d47742d07ff2d7a23e524467e0152 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a99198cfbe604d9168983217d7fdedb7d9ae5d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38b285cc7057d64e21ef51b6cc3e97d1ff1a336f7926ed2867aefc798958cdb3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..208ae61132e633220f6a5b21dcb4587252f01137 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201924c61097f8678c3dd59428de7697a53ee538078272e030e4d7b621d9eb10 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2e60640db804c92fb6505c8e2c698b6625d1fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dafc93ef297cd44a49dc20c9600e2460355894d3ff086ca6309ae9e147b4a61a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef36147bee8e127e592703c880b50e37b6c495e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96706ec8ab0ec81b6b24c339ed00d92fed65c93de938b0c1a48e5bca5221080b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..582d0229c833a06c5523d19f7d9d34b24fc0596b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2096811f378b15b4ccafec134fda26ba6c4cd5173560ae2d9e47dae28408ccf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4fa32af109e3dd4b1770da30280aa835bb11dda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713d791a389a1aaaaf40a07a47eada6abf02e2bb2dd01cf311238dff9e2ce313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40d902f038fcb32905627eed8376eace34f86a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd29c617ac0f813bec73bb865775794dc59898ec540a96f9c966561d5c6aaddd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca68e551a67858f9e1b0c1d68d96b466155d989 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae68428c5495406653bc50aeac2a8b58e6306e49fbc0590df4e7446bb6ec211 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab62f175b9dc338696601d84414f176603809470 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d0222f8fd938d2c47e1c94af9ee87abffeadc0e2a27138569d79e2d4ed40c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1ddcb96e68f4b075c424756e6c69e3cc9be0f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a298c86353a67f294a374803b2ecfd0798c2caf46676d6656fa63d7fbfa435c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed39083baf46432d8f851e19d99b4eb2a476e76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f39419c1bae644952fc07924dcbbe2ea2eecab1e5395372b67dafd4d779626f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63f6bfc1bdde08209c008a639c63abe4ab3cb782 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9914bcf66e28111706c49dbd1dcca10d5c8d98fa8665704cb83b9cb17c25e7f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83b6741611d35d65c2d0e663650cb814ddabb3ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b69593197d4a530e82db4edbc53964213a7ac0bcebb44bb1aa06839e7d3cfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b021962047787c12a536ab2cc9468ca10936456 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b895809a45e5ef523c73ed88e671646b3fbd36ff4672f39622b88cbe59c809 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e201acebaf981f41bf810bb2c6c2f44e4b41ac3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d252fb28ed30f65cd7ca34145da9ab347e26f811c0743345e56d11ac260e4b8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba992bd1fb9a5ae04dc89dbb50e68aa262eea931 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21627e95365581d0623cf4d33ed5031f2915bb2dcccbbf8a1a79cf6c64467b19 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d019887994cf419115d478d33ec3e1a9d29f0dcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957b5a4f1b71ae3e2a182e9eef9595909786388115bfa0378a65ff6079aa2b52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da619af30be9b495e2b787063c2e100efc5f49f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cdbe189b0e199ca6ee776f56033fc4811617b191915b8bbe0c5fece5e989219 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aade008ca5a1509e4f3534950b357eba8de41f92 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6a3e07b8220916fdf0c6154652dca4b244f79df9a8507aee62ca47089b93e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b6f189874d5388b14b79717fba9b09a5df8c5d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b643f8501c44b92889356b3122612d94fdfcb19ce80d2461a30834b74f20384b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b095bb3e83bfefa6aa760672d52cefcc79c391 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f2ef82f532542f74afe123d8dd843a8f4a662c92b073e60728ac17b6b022af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f2fecfd87d21d0f5fddb1bfde55cddfdc7f023 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314e2bb77b14e1a38cc1121c4a4707235ec5b6b0a3aff7880f59ff3e444ec4f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f08f466aba6d292387f30aa86ac2e95b1cf5a79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca16970336403b54385321f43db5a84671dff077828a8d581c1a9088321b4e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31bc2c94b6ae7ee963c3ba03d0c7e8eeea9c09fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a66db309451796f4df948fbdcce575f4aa07d22846e750ae56b172496b38459 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6980039042c5b9cfcf518dfa7314a71340502ce2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f0291b74b8943a38184fe0ba48edf65ada62e34e76e8a045379b4bbe8bc4965 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3a03273cc53958d4973c835ca461ecedac3db70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e19bca98bc2420881bfec2421da8ea29421ca21fb58fcd8bfb30da6d115c54 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf1e9fff3ba6c73cc8b1fa3a946f6f27bad1ec1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4ba9a36359b478bb4b15036f12aea937ed065e8fc2a452e5cae30422adfea4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be146eb104da3674cc5770b1ae1295d35a24fb71 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862b3beff71d57e7389f4307fdafadd38b3743cbf510d466188fefb186d78c38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc070a38ec07c2bcd655c3208b74b81cd52b2d6e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf9b25f650cfeb6090ab3b77dd8e4fadfff4ec3fce0bf80113aab572e777753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e0889d1650256aaa3bc45f4f760a430c58a8bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce3ce235e6ede588efc36df65c1463d2255dba67fea7ba2731967d0d34473a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b9b2cdbe082fdca2c5f3c58b9531e42b7fa0f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773d2a675c7367bb8a7a2ce8a5078e95b311e713e24550f946968ac854a4f363 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68f15c3b25710b28ab49c89334f74e33e11a573 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d3675cb78d15d1446c005f100189388b22f9c762be799d62ab538a24b3d9a1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..497d93478f08b06f5e6eae78284c792a15c73c61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4c80ffa6b45fbbfb36e9512320ac44ea909c41521d08bf34b97793c9fac1a84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca41678161c531208b56e4fd351e90d1269e6b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a47677fc111dba8e5d9278c8b9b528b757e2161b882aa3729950b7b7786e84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2ea655233ebf56f62544fc2f02c55d864f6faf1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42823922416996867f2cb6cfedd2d7e7196a0ae9a09cdee8064331ce7fecb72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae5cd1df1d0489369a6517d6502c24fd1ee34535 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d86d988df38eb8150c343c87246d9573c634c4c318c0743ad731195d6c6c47d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..090d3fb1a104ef4a19579fdff8abd930eae24502 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae0af79205cd60b8c19132d35b45edb8686529e30affd31d35099f7dab79c91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6163e0acdc4d7aeeb19c101c167871b151dec3d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b53fcbfca35ea670f89b798e5d084f0810e1f0d41ee98833ed290a5eeefe06 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c987cb95068ffd721d67d797dfdaeded167c613 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835652c0aace64ac87cc0ceaa7d8cb054df96786fe9ab992081e8778d0c0c402 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0629f4d74238dbb3cd10ebfcd3d821c71c67cbe1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cde5583ac5cfb8a49459a606f005abb12fba9367c524b0e45a1d0855b4d0bdf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a2274b4f4596cacf00b07b36407359f4ff2f8e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325cadfd2d136c3509eee21ed21e84c7fbb715af8d5838f404d039340a72e3ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0d8885e4c6381255a67f662725365a9d6c3ca60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:187f6299634bd7c480444722391a63a78ccf31f1e56090e13abc3bc514f18b9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb4407e01c8cdd0035b20e0da9b1231d4f87e3f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203f502c285b193b14f8f1de91e6d0f293a98eaa7bd5fe2a145cd61870ede291 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a412f6e973a8207a414965227aa6a549f316227 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9cb16acc5c38b58c973116bf9c4e6e38feaa0e6bcac971ef727bdc6a8596cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73bf040bd932ba203ae0cee895d7ebad1b0f1569 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b46e8177ede20e6762a72fbb1a7fbaaac708a45bd5fe385c0714d47dca100610 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e984bf7270d636f970d19325bde21780ca075da7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83bed8d8add2e1678f6743d4fa56ba0d43b9385b5acd6e64679623c3c4f543bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..318e7babd0edb22c84aa4e082bc791147f09807f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d0ee689c5243e158d11b9a116ddf5b70bf051d348332307b56a11332ba64f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..606b6af975ea9128851fefdd40d6de551de8a1bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962c5e3b05f81a750af8af28a53606f546695980c38dfde5206b027e42e58cc4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11204a68c39f112a592558a121d9c378e9ba0d5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03575a947328c3431782d1e4ba849eb042415db5401e0d1d99680b48c191fc9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cd23764de5a6f6588d41226f5b4db88822b5f06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c20f1b875587e4eafbf99c21bf94313be8ffc181b415ee2cefaf28b05699128 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec82de07b8984314c310ab5481030747bf20b48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc96c4fedba93d27fcf36b0aee7f99f8e1f7a860294b4bfdf5ed9b4075a84eea +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1135245a3d5bc074c5691ae134b10450d956c10c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523c0ecf2fc34369c74a5f184247feea46679e3b7b02d894ba942c9c4549bb75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2231bf0a3cfd2293c86ee009bd9b806b62414046 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9e9aaeabffd39c765f64b2abe40e884a43e722ecae4e8bed368319797395ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9907173e9646622d5313ab996db6ef9f21852528 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3842cf7f2ff9aa53b0c6adaa1c0a8c57dbf9c6368fb7ad905c7a92a606aa0609 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63dec48bc3ea52dd8ed129538e35831fec768575 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f7ee904286030bd74de72c8f3fae684f29aea1d860e40af2e361b4bfc31877d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f420b167d4f7e61b991260ac93af5e1ffcf6903f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf91510a8f3f222399537020d95df2446e64ed23de2db6ed97bb31a3ba8d434e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ade26814f1e8b80e28fd2411eb43dfdc084285 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a193cfc57dd434a29fc0fa4dd1dace13114345994968bc436d7e7a318c4c539 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2981a0c52bdad89039642dd584351b047d71efb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adc5dcf3f23750fcc3bd1e1c79fcfca90f4a064f1e48da8b886fa2f5b187eb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aecf7c5f40f40932aa1f7933ea9d2853ee318883 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d463ed3fa1a67277a7e7cb6c3f300c0f533d9ebc694f51520ce7eee67ab5eb07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50b04ee47eefa880b86a464405f67b711f3678b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b542edcb55227823144229749f5355af2e0b10073a2ef56c2d72780b053f629 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63aabc21b2cbdf9a457432f649a5275ca69bbade --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2195b7c730930925cb52d3f52b35d5b79811417e6f85ae18de1f1db5e1fec64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..693de8831e65bda355074284180811ff7d04f1e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60d4323d4a4de40de643470876e2376ed3bfacd29d7d1bab5cb1530b49c3a4d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..890fd62eb05f6be34ff5a993d025d9ef274ac978 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968ab6c8f33e1e8fdbe9dc7c88c732861fad6baa6c12fd5260d6d3483e5a9a8d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d809119a96c9b62cfeaf9f59cc0f08e9c573e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f7812740a8b606f5be2e1e4ee0225abc549dc92637448cadc5d43edbd1ca51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d343fcc5a47e19b938979de23a7cb0ac2a753eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7731dbb64722b8ef2e45d91997972f004b36d407e31e97e16f120b28cd0c6c31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f062fa4fca48451e4068c709196feadb124d1480 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6c24a43567fc579f56c30484cfe00383ddf1001183a143e0af70a45224dcc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd2c39d26bf3608f3268be6dbbd88b667d6123e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc3fffd54ac01dbde07927bd36e2a95ac49fe663e73b5bf8639fe5073d2e5a1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e0bbf1a0e6dac21a882810d617fd7e40189241a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9939b45b32f3a01519bde9d921c5c4d490ddc9db7dbf6a03173e974caa0ad7f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ff9aac2dc2dab897df1c1d3b3dc38f0538169a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111869a7e73e7f59b6ca913f4380f79cf47904819a335a3d4b5a8882e9654ad3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a87040093097ca444dbb50f6c3f896382bddb12c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e964ea47c067658c04ac1353410f7281918552f63faa218a9c72d0dfdb3fd6f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df9ef5c4b26e5150872c2a40d0c8b9cefad2199e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c4abba421a1c3a8e7050089f2e4cb584416e2da1d88f54826b695c1e8a643d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65e6d65ca1bae1c68de2a0b01bf36494a55d357d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd5f361ec70353727a38dba5c6dc45fedad806585e9e3845ea0f67c54ae81d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eac171762d03e26d75ec0c485aa8e65f787a9d8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef69ce70512ea8a6bdfbaff0c0f0103986d2b1d0e09dd550b53adbe4df555d35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5349d0a37c11a9945cbed7e53d71d99ff28881fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e725062921bc1ab25365114152033ad04654ba1d5988d4227fc0e9384957da +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb299a57d5242cdbdde9d040edac05660ec3ddd8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bffd3c6089e02bd2e212ca2a9d44f2db81e4697d7e8651a1d2cb7b32168cf18 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f168cba150c7df8403c9cb751e47a775de367b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672947a80009852a878a0db0a7ee912f99576d4ca9e2ebc6a8fc83740bb9c518 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21daed5e9a9d7f2410baa28ebc7fd260d6ced5ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9602079b8fa03077d52d090f8466ac9f43cca9a04cabc08790d06dba01527a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..461cf43be831e109acca25bb39c6b1fe36a6f351 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:059fbf844693c239583c43c81d115a9c35bbbb194167dadf48b599eb39277d67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c231375e122d53dd87a055ea45541fcc522987fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e95f5df39225101b710a557dde933db9a802e1f89f55d9ebaac6e0b7ee61f08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e16043b4b716e24505b8d4026611a74a3cb56af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce25e46a50f0d24ad481f94b92e6f45abfd3be1c1a15c49c1057672eb6d892e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc5cb9d3b2270465942303a2602cebf1e5bc091 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f7178280da03f648b100edfa0e3c55e3691995393fca2191debc4fdfa6fe8c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e48fdfc2f4312fdb2c3cf786152b4d98c0758a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448608e98c5b3f9535eb6bd1c3423bb4908a04d28bd49672f27167965d13fd86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc31732feb510306eacd8cd78ed1434b2fb3af5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4a6985597fa72f5fd531cbbfd93b2310b5da670eb887740625868f58dfe64e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75137217856489d2b67c586e60fc2c0983f7d5fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d307a628c6a5d12df43a6de889c61f4e3b006dcc8edb9213e010bf8e57e0a74a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4181d607840c745acfdf373fcc4671fe1d4c94c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22724868d993a00a70f7b615190c32c2c8b89287d10e43e7f75c8ffb423d159 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b4797da2871db0a9d153c945b83a6d65fd5d15c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323fa33474c7e2fbb7a907580601944420efbe7ddcfe669aa3d4a09460e539b9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61c8c61775f507e6337e6583dbbd33c1aad5c7d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ee38a573426432494e098e82dfaee67e738d64590cc40a5459f96da5d261fa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..418c4e9bf303664c690a23c4c291c67f56b271ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d969f4ff361438a99592cf94c35454832c74e3119ca258cad023fe11f523ed6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86dd581f874190e18eb5eab452daa864ce37d065 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1c21887fb25706175652fe7f0f2090e1ca7cdcf5c3ca0841e0983eb5fe3db8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbcd8a9d3674a897ab00b519ffe4c2c8fc3c392 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4824a88602dbcec3f4c426b580414cdf76c8fb8b9df3a786915fcd8e1434e291 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..051be9571d0df15862b25fb0e53e81a685c2c75d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436e6309dcbc32504dcdde49735c469ca55c5c87050c044fa1f873e84d918dd9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..303d8c0b30cbcb21fe04a977e422dc0f29484b85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fab9cac884f7be1b87ff4585ebec450f9673b90acfa9ea6dd2c41fc3814ba06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60230230783a9811f619ba87169d89b3c29427f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f746d741250fb991b2459fee54bee0d29ea2cf621c7247de3968f887986de45b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27f5e843aaef86bc5086b27d11678dabe0922718 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da45b7ef86c24dc3c7f74f3dd8a7222b8166a1282bb9898a618d056aa088313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db1f98cc18a870efab67602d05e64a3507742226 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa082e818acad2aa9f34be0147b355e87e0cfc3a65c2695064e6fe00abe39c2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9113db66a6d10571e0bef891b8124420be7e7230 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6771244fc3c023abc6c60735e8ddfa403d29013671a4ff4e37eacef93b030fe6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4d5bf18b8bf5f1dc15973411bde5fc7053d3e99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c9c00c5f7c3b957a2a0bab04b6cc8ff6069745652167ca9f092395778525222 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ae7f620a50270e9beb7e6c9aa4ef48b71504d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474b70257083241cd28158c13e3197c0ad28a24252dfaa73a5964b1da7a6a9b9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b10c85c258ab04ce3ee761abe1b1f681d54524f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e6c843aaf4d0c5536d0738711336169c5dd8a9101cff79754d6c5deca57253 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46783616cb12f3d6f48f96939b7f55de5da0d4fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0221eb7268a25d4f1268d12ac24e92be41314ff004f387234f58f8b3883947cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a0c40d8d6fbd0d39d32d8f39d78021f5edaa88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a81b2d9970cf8735f5853155916fcd51627c6885180e5cdb810eefd9158e34f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..604f5bdaa180e1bf4bc9f827b53f959d4e19e7f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2564756c8b728af7b43d24e62e6a13507a99ad972882fb9cd15446861f06f54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..212cdf23faca9366d1d23df8c5cf390b339037c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d020e9357163fd7cc82b900148c3b6a2fd30271dfaaa17e9761fb7701468b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..708f3388c48eacb730d7e5a0b85132a2d68ed2d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36e50cab79282e5f93334239ac33a02b8d6cdf53ff2d22f71f40ad4816465f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b8a87384651dc1ba0f3c5b3c928a102b13fbd6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbd26badb97f02bcb4bd4c9dc5e63dd69c70acd1b001d9a3d019f92041bd5d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f183448a6e50f344661363e708ebbf3ad9ff80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:074d1a152a94b1091923dfd2e1a32d20ac81f1e6037b74cbeab6bfeb6015fbcc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b92ae48e945e6541410b75fd24ff146e2fbe29bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0590ca141c5b7a53826b149fbdc1166173052d93b02e43029cd2ccbc787978f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..428facd6a18c127656d77771cc62e3e16588b013 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98db45c6a3db809b6416b58682a79d561c809658ab0de96943fd28bf480168a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9d93582a16b04e97764b834d7af30837cb62ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d16c985d09b269e843f03e21bdfeba0c28fce39460b914ebc883b14b6a7a36d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be23c30e9c53e84ca3a64cbea034ad5760c57b73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7b1b0e1fbce10c357494c2b896f8ff19b8f7c33cae45d562f275f98dda36ae1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..095fc1b371fb7d0448ab4ba9e87647ad7c580cd1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1166b4d5bc0d1ac80e79e9c0d99099f21711794583144dfb5c53088414c9d94d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81d196c805fbae2ba985a91fa7812b22899d90ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a73ef1730abf54e914f34291139bf9f7055659d51015b6beeac41d8b56c250d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a900822600ca78856e2e7d758750307b1196f241 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c1bc5e538efeff18e401659e9e9705511a797f93e097216994c7eb812edf7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cd2510b0bbe4cef85a0ede36b78a11dc2fdff4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf927844809f90267b80b378045dedd2c76c1d6d7a29a36cb8eeacd778602616 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb05f480cf867a6cd8efe6102b74a5985c3e743 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511199a262c325e41f59b70e39bc404dd234566a0fa10ae5e38f586ee8fe6b5d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f836a91366a181b3747d59bd668969599d838b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16767cb1c5885084053978b01c75f3a43010b0c44ab3a94a4f5c808fe3ceeca1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5617ff60d335e55acd2132fd7cb3ffc8a02749fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe5bc969a6e12abd974be92721fbca6078ea2bae13f90f1920f659a8cb26535 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56edb5c8a0ac2107bc61a2f1a6efcc31fc2bc57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f982a9da354c5c39bb528bfde096f09d8f496004641b5514c9ce7abce36e870 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01527f00b9a80c5ac2df4bfebcf6e49af2a47d97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0edc14d44eb3162160513bb19769d27cbced88a2f834e822168422e3aa6e6b24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab775083d71ded15a2cd19ef996377086022511 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a229f1b116b499b113bf075c41be9e17c69147a68dc2bc821062783706223726 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab7afd33ac601c33e06ce74f163360779996da7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c2be8bcf2b88fef80de8336f3ab46382850caf6762f5846e5a7426de0ca70a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c88183c8801392a39d7fb501d8d2acf32cc90e02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38e32de090aa19f759777b25d6cad7adedf72a10d52571e77d98c3842d51265 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..121091ae67022fed84e2009327e19624304b7110 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c138c68ef5d367fac3cdea8842f6ab0ecc049b79d1494e2de80630b2b35a866d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa14632b25149c59c92d5fa9bc6eed79bcdaf7cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74b75c983112f882509db376d670cdfb1146579a195fef7794280a7fc85d083 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b69dab4ae743be2dba52e44f38d715ee0ee8d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b90455fde716b36c53cbc87b91d85e542f613acd4695659e4c7a1d1fc676fbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3956ea724cd3ee6d89ed895b532270e182ab56d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c220279329f202812f2137478110973a89141901f61b64719a67dc979e46d15e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..195be0bc0784471f6cf380223b0f590a86a5a28c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98cd5832c0e0dd3976ca07f11a3e3a86d79b470da250acbcd8fac629a9c54236 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f614470a3558e4063bbf8eece245574f5b408a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1cc13f7a4ad24019a963c472de418d4ec5b56ba60e2f08503823e230f78cd6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8c15451c975194c899021236a1b8707823f80b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a5ac4261f6e194a61b2f0330d76e4af7170ddd1a04581a6d89dbb423078762 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b30170249ce8913d30eb45be9e33f128d7d5af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8024dba70aa302b347832890445bfaf1b739518c4e2e4d2c4d4493abc12f2a8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4301f87e39edb83ffd07c48e14f0f58fd2a4a67b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058cb3623496bfd064e5d1c58ef899c18cac5bc75b40f97a177f2ede3956d2dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc546834cb8c0d1bd79c2e0df990012c79dcc378 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c384a2afe06008879c492423e7906696c6050d7185ed4096b44f1f5d1a9359 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e49767f30dda06a5dbbd0e345fcd52426c75ae6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ab9bc03adac0fa38ffcbe829f46f91a9a65350f4f05ed42f7cd3a792524f50 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..448d998361fc5c800007719c30e11edc1b24f9fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e09c0eaa783d7a58798c8975303020ebef1a3192a80d73c65d491b8dc076af4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1143a6584d9838a0106be89e14b7dcff5ed34d4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a72d28ec8f46b036b2bb532140bc2079fc1bbf6a6de96c09f60e312a993ce4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9238d23ed2dc32c7997dc92702e4db620e63d7ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852ab55e7be7d55162e6241680e48e244ba507abfcbc316acc0da2341e203b6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa9f4751a4ffc2f462ee44257caa7a3ebdefa31 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1760472f0b44f2f3b8c96d2b498b538bab6ec8a6d76448898f0d3daed26958 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c95eefb19e0b3273fd2ed3622f08088afcbeb56b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4501d267465fb5a510ac4d5f98809293b641ab6d36ecfbea08ef6de0874fe24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a593e9cb3732859a315a53beaf023e371cc99fa8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d6595406b07512b37821fd7d704b7b90199a645450de7995a142b8660c9e65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a2fa0b580582aab5619f333fa134e45a41111a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d8467d62089f6a70a172658313dbaafa0c9d4c72f9131f14bfc52ebd062783 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a745896a4604b1054ea16fd12e6c696bf656d773 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6bf3d2f3104ee88a630aa31607031d94cc3c9c3c73e55253ff701eb71c9eb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..943e28056de042fda8a2358521aed502506e6e1f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053d7fa5a5034dec0e2d8882ec47afca01cae79dc0ace2750c0d94210a0c5b2a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55cf237cd28d8e74020456605aa550fcc7a8dbd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9159e3ff0206daf40ba18d1fcb1710b9f1d2ac69957128044e93fe35c1add9cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..417dff2e0a2db28bcd7da04920d12c5597881f41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195b9b7dfed18c89596f008209a5e912be6013efed7185bdedcbe364dfd80003 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f137eb748466e97417f50db49d239f1c765ef9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37f3d38595f233dec383eb5cd4fb604d411d20c8e32eb7689387dc871c22589 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f902f9bd75d2bd34578c490ca8b2e48df6612557 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea109cd63ed550cf3333c8273069490ce4e70a6a82076c83038fb24e93944d1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abcf3bd99e229f6af17f5db81dcab997a8b10e01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a2928e360143e764fd570e0408d821ab65a5dfc215c11d2847feedec31502d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55244bcf67bb1bbded374589ab4d9293a4e46922 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2de588e8f1d17666a1ea59b4918f34c2a6260b7c83932247c38cdabc4d04591 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0cb216d4700f1f5e9e8b6efa8a5f757cfd552c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d54320366e0a44479d5df1226924a143e3b55bc4812e977ca269ab60e06bc7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88ae8789103439171c175e11fa9c78c9354cff26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f0875e39b85f22324d719e888283535a9168ff1560e959a4f4d286c98d4075 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e71f6fef867bae006f4851bfe7c3981fba5567b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7bf5f80e7f54c10f962af07bf888b08f61abb8168661b993cfba94a60b3fed0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a069da7179f15a52c8a563b01a5083e42c5d70b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e0fcae9c05ad0edcf30b2a739f848ed164dd9daa09c48c4b3fb57dc2134358 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8767cb94dc47b9ff0d6121fccf2d89e16ca82d03 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:650b0a56f9a42ece48f1d32c4d9ed1eb42f162e97722ac6c7392b0f00383b6ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf5bdbc43361e8a20fe86724610a348dad57bb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd666c2460da92dfea12c2a4f9e585b4d480c7d0deef8838540463c6d4d54b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7473e343eda4ef608adac1576f563fc833d70490 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa897d574d0c919dda709a5105339046f84302fdc51b9f60589ea8a2f42f69b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ff4e6a1284033d1694a83873c8d4467486d238 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40382aae4a21e5622bc9f501a537223de6e3a3fc1fd2eef78871bbd3f1d95ba9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a3b229dc1c881a95ce6c30d4e5e50e61a2f509 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc928371b9f5f00e4cebc00b8e8b970f1f4013d0ed43f15a8493232ff159672f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf456768cd65963188896bba22e3d5bb3e502884 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32037aba33fccf8d7cf50338c22a8a2ae48cba1e17b60632cb3c599e55c8d7a2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69b9a72407619e397bca6841a376273fdd9b08cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1152de611d5c4508000c673a0d9b127985d65166605729f068ace88e2bcf1d1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4d892541d041dc66fd1949e61e235d223c5c573 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5a82022f60d017f70da97655d89d0d5c37b3856c0f58f66523d8102ea1b5f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbff34e064c298f065e3591f9eb8cb42e6746cf5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e817a3f69902fd30412bf49376334c47c611ff7ce9267196c3101777d9a6d9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef28c9ec0ccbd690ab03b8e18b337f53e9421935 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccdfaf1420b53dd16eac566c72e93fb3b7392b1e6cff01a7fef4fe0a67c002d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b17936f32ea11e190ffd0393b87ba1dae6578c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50db934fafb0ecb05eaaf7ac97da3d3952325daa900a6b778b9e87a94958ecb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..885a34902abef7487d3b453f015e379aff1c61eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78938270467e75e945145d8ce1ab2234ff4ceb92d96164db1decce2442be8b2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad72ac89d25454c6edc6d6ec492800645766114b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a4bf80b3f966ccf04132b32c66ef4bc9c30ac095877559fc8df68fc2db8465 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6618a404106abdd908648a41a42b44733179bb51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed6b25099301e063d9debb709dea06904f4fed9aacc30d6e3de76f8eb4bed91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e9096bf7e720c08d1407c8576c8d271bdbad5a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334953fbebeae434e6cfa36dec1654be49ca209bc961cb106992077f6b0fee2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05a1cff9b7fb38aeb212753a2e794382a6a2e360 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e718844b31e834d68e250a23a17d9847db2eaad466602ae8d46b6e7ded2706 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c5e66c0c9dac57daa9f4509917fe0124654af01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3118bfb28a69bc7cdd38634212d86360ad22b16f7895bf6ead255fc99b0f1bdf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d83b53b215abd093e8efdaaa779dc6d27bbd8086 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5674eb81d145ac923ee8c53196b690099adc537305cc79a5feb56e261027a587 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07866cf04cfb40cc4b4961e9d4b3338766e7e9b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a0a001d1c0454a6b42f561a31e29560670d874234f50ba1b27132f1d7ceb2c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b58ac4ffeca30f72aad198b00b5c0b3fa7dae70e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d466f78cdda97be8e90d5cc37cacfb2f45087cc7366e84be793a0400d05f24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96852c1c877ce810f4c79188a0b4226489ca249 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3cb5e2c1cd9053765c20f65e99a2815dbfb57468e49a60e160e51cfccdaa471 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..697904814ed754410316e8b270b7375131ee026f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e83511aa63de3525cb19349ab604d03f7e963b4ddac53089bface19020b3ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..386b09e2eda429ac7012216764713b7d868ed3ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da7549aa14bf2eace2d8b9ee712e3d7ace8f7d944c05010f08bdc72f161a28d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2203caf8316e3a3747e556c4fb0de2c7ca834676 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52eeaed0d6dcbec890fdd09dbcf5c6c3bc41baffab0b181f929a91de7b283769 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f80f4a9944981ed2a1785e94cd0096bf23eed9af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b1b0e32d4889f2385cad0370aa4fdffa232757dd7a2bc2ea5e48e905d05e14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f670e38975bf4a651da068d6a46b636981a2dfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a28726e8643971d41063ebe748655fd8b8ca72b0662a54ecb71b52308fa3da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df2ce4089d4d957371b7499a5ec4fc65c86a1cb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca817924096420520bc30cef950b9fbb97f93330f5441bb3dabaaed9c74dc59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4499b7022eaa32d328585a1cc123bd8a6e3bfc02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f077ca5a29aceae66033f387e4808e4361d0a13f72b8ddc00efcd8d1427fb8b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12597b89c95facee730d728b09016c28880d6594 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca718748ac354b06ded4a80ef5d9ec8e3670be973d8c49d9c5091d6e4b58890 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe11af0b5d491da5844a06a64cfa79839db9eac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a1ffdf69914ec908b312d9f8042cb75d7f63b1cf1f78688d46d735d01b064b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e2316f7fa27888131f691ed1a35d81ccf488c9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15976d51da533da2c43e44381de24d5a5f615222e95fde85221aead57e2132ca +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebdee64a2f0f56b8645103c8ecfc51e629acc9be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7877455413596d5cabf9d7dd3ab061101c5713d18d2cbb97bfde381efd9e1f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4723727a18be7e07c6e272453ef7e3e305c16f27 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb6ad2afd7a3a2d5b44e6aa9d581bdc9709a2beb7da24ed6da742aa9347c65c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cc38aca8feeef5b166c1e65d93c3db485eb51f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff61104b563bfd336ed388b3641f47222d04cb5bb60ce2373112d7f711b50f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f96af40a39085c5d821dc78baebf34079b9badb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85df4778cf45c17d21948736c21b0969eb7329e76e39df9a0d6840d946c6631a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d667fef88c64405e2863c0af1c59ff76eb2b0df3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fbae648d9e11146cf5eafd5a7ee20428494b380ac49e89a53cd9d74b77ec3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc7e79c272bc4f59d2bfba96f9901f871603dcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e10313f884960e348239ad5283a84ea0d9e184ca5013cf1c8fcbaed12bab9918 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96d7ba7a3645ab7a4789bcb1bbd90cd87c0f4d6c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7852d7ddffa571c73e07420c122465fe4b0e2b6c2db7d10daa62af3be216ccb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c07593e7145bebb06d9ac32abe627e1bd121c04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5fe5e1d44e28ea7c64ebf71a4367b55f4fac579fadc0631e5b7e8afefa95e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0457d00caf40aa5f5c89c2eaa3417b64d0d5db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd56911ba26c63800af068c13060c827a9a733bcd68fc6962c0ad3573bb4666 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..971871e34231ed81ba66e831892d714503283316 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4209800a9baf746aed929a34fdb60877797a0e34a46dece4f9b2fdc5c5ef6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ef51cc97d7c3c59672c327cddec441ffa93a563 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dba0e242db48ff5d6595f652ff926169afd089f1d8c8b0e4c94df18857e065cb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95af866afbfdd51e269497b086bf025957887a6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d5f34a52940d948a485b65a572c6e273b789412808ac6d3715199cb3591fb02 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..915966204b9a0fe76a3ef260ec9455b4262cf324 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac473511cfd159c2b7eb9052f2d317ec9e4d59b1ad09c490f9f402ecbef06d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de849e7630634a4a2038d5348a8e2cca407b6e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04464e4e4611511bc7d0e00ddb8654ebf3022d77fb6eda1024c6878bd463160c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc207bb3edf9b2e95913e48bb286b333c017dda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f891b733533d359a156f80f546b14f4a1cd1f497b477e2573153eb74b657da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93e6d7c2db903cc5e2df8d0c6ef7ff1d2a5cab29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ade375b161c14b3573e7a35ba16d3a9d62abfba394a0f0c12f732f5948e463 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa78238c1686e4e15bb056511115347bc251c48f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a953b1ec063591d55ede3ab47dbff6c7b780c83f64248d2f24487a3a8feeceb4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af412d7ff307f35b3e1008bdfbcd909aeda40f89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4cf41e49037645ca4f4d63ec41b0bb8f16f528a02e19bef0e77e840f8b7fee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5326f11e981675313caa30d9e7b2f35b12151436 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5725d78a5a30fef2478b4584625e098be9a82245535510f4db05cc932907020f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a3e2f1baa5e4a990c7e053e3c128efaf64d58d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217c81db4813a4904b5bd2f306983214f8a8adf8b12b6dd4c8d2d847c83b513f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae16099d4f3ffc2014b51ac27bdda6d1fe378d6e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdec41fdba6bf886cc9b990d2be779e02871589e27e368acec4e34d33aa48c0b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..105115293aeb769f725ff8f5ab363d951b9f8f1a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d94b785c31024b39d4c1e328274852637f5942187e3fc8371d19915f96a3a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6004de915bfb01d72ff9f3104eceb2eb4a8ddbd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:602a88692aa363de5ef050199977bc9ca53affaf65b52e3ea0b9c38944ec76b9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..305e39ae78172d77f0de3f91601552dcf24b04d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4d0fabe3e173fcf57236122dcac2d8adad8471175118c10fa8b236264a998c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..882edbe961efb7f0fde53eed4a7211b586e14d11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acf863062c5999f15d007ee3f8d969bd8866954ef4fc748fe7edd4f34fd39a24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebfbca8af5c58c1de8e61f5532da962161881536 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1225735ca66ab4a9e877872749e5d00906cca5404a87c8be2805e8cef79de654 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e000fa84e01f4644e9c0bcd641d5a305c4f6da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f772bb834b364b2f59777ae78966a0d0ed6eb93a267fb072c91838d673db751a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40abc79399e0b3948f8db81cfd7502d22b2e7ea2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27ebeb28e54d65db62c8b458cc5c6e8facfd857aa8e3f3411e42794722ef424 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd02ebb6169c9db4b7fc5587435fa9c38b315de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6c009f04e2cc271dbe61511ab79a4a79c40a959f65ff8b834257ad8e15679a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01dd999e5ae21a7bfd9953544b5669e788d564ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef52bff84147e5e0d0c22a5e14086ae7f8a96994b257de8de181f47a6b1cdb5b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9f71e7ff02a500f87549693f7b9431605289df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d08b3243ebdb2b5f30f1cc6a998109a91ffbce7ea5e7b52eace8cd1f5cd13ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a5f2147f9529b6a0acddaf2f978c8af62f8f43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27468a412864c4548fd8919b26b4875b8a65a949eaf5e98b910d70e7d1fd2872 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba0bbea8221a712a1e46f8f5d82599794676ce5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8faeb0e0aaf52196c556af96b97c18cc3cf3862122f2335a9b3a60c393d035e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19033dbc568361eeb16f6da496d83cb2448f5369 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b4dc5021af7e7423bd05c581ce0cecd7319817e942b741ebb064ac369af0b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1797da0a15484ec1d15c642fd8b80a4b7af485ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7fb58e063ea3adff859af3edbc5df6aa5f4e214e86379611aa9a8dee12af78a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f1881346d21a75bf224d01d8895f66a23b1984 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f214cae29462ee91d6f509ef3895c48471f348db6d094be2760c2a69c45be6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ca178b1c50e2b05d69c4ec34b821f473c52fd8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59362bf9df9763317a59393a3b150a8398c55ce0df173e5576a41af967ee7ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3528772a1d5569ca23f1b7a5a15be4e4100905b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fffc5f2a39e2a1112f5ecf849f5d3c645e69fbd9b2a5fb47c9a382becfaf12f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca12c0073bd9eaa61c6f9928fb8327ca8709618 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42fe3a67939b7388128445c598ada8c6890c25357fdecc9f10946730719da3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0865031c1d59342857c1c8feece189fbf89b672f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735c5e866ec659452f8fdb1d4f23381c5f1774cf2b9917e6155c1162d66ddccf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fefc99ae163663e8177cb942199bfe0ca90b9912 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea9e7a2e770e7e979650461a17547ab44bdbcc72e027269806d8409b7a39406 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4151df2e0dd47fea114a3c30098769bebaf9864 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d3bb06e3c71fa3a89bad663047e954fcbad1e8223b8f7304a7ff77b77f1d0eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a309e52210a402ed15c93dc806e7bdb455cf5ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdccb4ccb31aaa316a44670462caebd093e0a4dab37a8e91c9f57556166692e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75fbf2e981081412dd5c85ea6c42f3d626aeca2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da73a295a735638481992e68d2b3daf38899ee8b9f5e6f15eab417ee94c46e5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..177900e0230ddaa017d720dc0b78e72e9c51271c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e200c8ea4dd2f62ae67c2e6d5cd84bcdfe9eee9dc6d23299cf230021032e8a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53302afa4987ec718fa86b1e056e9321a555c76d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a8db2aac9307ed0077ac80843933e91d21c8450e223649320dcc37ff6397ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0a63fec425127dbaad7a867c1566d48cb262bf3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37b768be620b6b47017f42de552f08e0722893ef55ec5eaade15446acec4b24 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf63ba40507563a56d17ca2218bb6727454dfc2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e35c695f67ade1e2a30b6623e9acebdc0de10c68bd3ee57625d97e8257b7d2d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da1ae50e140e87ece3930d1a1818cddde328779 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57bee060eefb80bebec0203e5140933bc72c944c434cafcaf7786e55362fd81a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3156b41c935374cde16ddd929bd74447a6d089df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa13514416ee77d5677391525ce4d0fb10d1ffba4feae26a8afd46b8f6a722ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18120991cd5de96be1ec64912c7acea96b1f5dd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1c6d4eb34e27d9e73ebc7ed3eb4535a4871c81f0fdc5b4b9647378af990fdf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08ca2dd6af88dc5558a8284da9a4358aab561a0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82cd693eec761b11b87aea6a6bb17e5201c8fbbb7eccfd8de00b9282d31c6d8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2b62635c6d010068b64eccc53f3e07938d9eddb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f1ebc49710ad0f0fd322c12f967dc253e72a595165d840387b4b80a17e1683 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c95210255c949d5da2cb08c5b84e0fe743b95dfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37372104eb95d2f56f8c07349b5767770436329f23df55f174b7a3f0dacdf9e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a68faa797a965a839a709fa6027d43cf9fb5cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d37c37f1d38ebe23882fa1df982ef133525921891269bb86ecd2ec6c900cbf8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74caef27339fe882af02cc2c80fd4b11cb646ef1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4124923d109b7f47083f1b5526fefe75920b98d177460ca4780da5169a4bd83f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b354fc38f86803e86023dd7d7a6ed42ca01f5a86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db500451a38adb2f2d8f9506ab6a47cd5097aa7cea7e0a58ec58a314eb4751ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26b9e7a8a74e566df76366a1550ef991866d4fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b75390635576b93ac3569dbf369aed706a19eb4109515929a7160c54faa9aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e90df24225e2b891b8afbe26e350daa372f0cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d11260beb79725e5d59ebdaf6e517eb370bba2a0f3542d9d10188c823125895 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d424073de5dc0d6e4d45bc44543e177c909caa2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c6cf8a9ba32ba5daf60cd947d2a35d25bd06803f8c9b242abe00dd9ce1d923 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e7fd33f695a14ee70b24b9976bc8ac95b0ed148 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf81510d7191c20730cd1bfe8ce46f0282fd043768152d6a1ee7505ab9c227d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3f8f74e9e640eb0aa4428c80596d3d18565413 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d4577effae3279f6f547fbc0b531378fb3a2aa386472c0a55a2b8c48d23e8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..749a319f6e3b8577c7c9027a3c6bc69b4fedebfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c3bfb68faab116bd284b44bdd54158abc2f5775e8128f1a0ddf189aeda9685 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1129940cf77fd3596785eb98a20eca6f869394 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f69b76936e5531f1280d3a0abe89e84889c27a299bbb08dd3a69574b97147b6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6959f5af7c23235f8ee15e9563be0710067cb7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0828b3d5896b16769d6869afe5ba9997429e9e97ee121883470d38d3fc27fd48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f9d81b3a622fb33becd898bae11786097045aec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3b7963cd3de1eab0ca5639442bc5c78a5a44db8f1e4231f7b8c29bca67c166 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01bb6fd332fe50a504d5cc09bd9f857f6f80a6a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74cae86a60d861c31dddf6eee7800efaf0e5b85d620c45613ccf4712e721e707 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..792c58d74cbb1c40d9960ce8e84fe2a9cc8ae800 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e96801b99f0e5bf86068c991afca296be1cc13918c81ada2d4dc7da8b354ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd617b0c67d81208e92c51eccd38e327bd545645 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d39f2e2f845c4ecd4a883a1ec8b2b45b72b3064051f11b873b72d0fbf0050be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a46d6a35782901bfc5299a7964e1fffffec113d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41df0446dc32965ab326859b6ae6fc4e7cff1c88e2764c03ba0e8c2bf7aae951 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d3e6face09052aaf8d1a1109cc1cfd1cd9d05e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1208c5fd01486c022e92c617cf785b896d319b93bccea510f6ae16bfc8c439 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e665015e2a2dd62c8bcd792ab548300304ef747f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5b43bf894453c5ef8dc19e45d70ed9348bd6db974129f036959a1dee225b2f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec64dfd95214e2151812c2faf70bec06a6e317d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e298225678e340e1064f2f77516ef7886dd096824aa87e167030be23c1bf78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b5625f048f5edeea0e132ff1ff73b29fa44d4fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59131a402bdf7069c6c0194972dd815d94c98fd754f8037bc6347aeab7d158b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..655c6210b5149b9039b401934a6c958357e0613b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c534323d332319857d5dd90f0ed6c3cfe3fc41e175d3ac524616a006e92632c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..842f001f8069fab1459d8e195a7d8fc4ebfeee5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556fdee95145d522e866837dedd368dc641591d4fbbb876043c7976a53085b3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2edfbc84e46296ffcf486285083e61a705193d76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3929567a128245d78c4c54fb8f1387e73b251d3fc8117d2c72c821690ab7e8f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a321c32deaa946adfc38ce02d7aa6f96a4bdbb38 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40dc301e7de82fe83dc081cf08c551725fce4f6f5cdc2483db58aebbd76f7a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cec0f0c2487d2a99735a48e737d5d3c2336fab8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126b85ae0d8e610e71ca964945ae21d95d1d815bea547d87ae37ab751b53fd9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04afad83496a61973ede97b489592bd916957940 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca04fc8fc6c4dcb1e509f9aec6831f840f8527d1192578f53279439c8541d7ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c0ae44a2799716ef593f4eda2630d8c7312e4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8930f7caad589addceeb25394cd465044e371ccf9162044ec106acf1e5418622 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c96ba0fea7b979432f77211387459e57e6ab9ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e0ef8b30e7df7a153678b62b3c606987ecafa1d304128686db6d0183f68ec2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..262e1aa8e27555ca580c099671e74d5995731c76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c451fb09b6345299d8ad34eea7187e66f96a96910a330ab0b1c425861b08da9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07b3de68813b85ec601831504a74a38ae516ab1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff718143cdc2b2e382b350af689f9f1823a0973ee3ceb420c7e2c5e61fd68e82 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3b683ac20c6be29e26e502f848d5eee9b3ed03 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0649dca2d02924cdd29b11d0e002bde4ff7579802373f517237b79348a76037 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5889b0493da6b137c7a0cb45ce1d20b17755458 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e81ec13845d07eb4976a4242839ce334b1f547283e862c26fda9f123829a1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23159d269d5784d5db33156fa2a3c69dce25a06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5581cd6df439332955cc941629894e5e7c86d494fc4ace8df25e3eed23e50b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64228bc99d449f72c9a70e1a12002a401595806b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144779589c00a03a58e315f44c2b1bcac3e8e77ed40f5ab6b5bf435d78da23be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c58fa42a96b70b521f8911351b0046640e406f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07460534f33c8a17db473999787b0e07c031570a9644e53d880cac508a85abe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c859e04341040e4aab4b5a2f13a588ac5c39aea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf9988b2774310b280384a321182a6cc0caa0a256ff55192c2ac558d38223ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb374530710c3cb3c52ab66effa67fd15065cb7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c138b46b9af8760b0e887afefa1a910f3cd181623f4328a89a0710cb9846a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc57ffd9f4326851160b8cc522bde68a7f9d46ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985467480312ec61e304a032585569ef4afb3247bec8f507162ef8056447ff61 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..179cd6e9a82c5e7ad2635c8e74e2f48ac146fcc8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c02d9ba716720e70b611b6294c927e2beacce4e403c4b30afebf9ef5689093 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f1b4bcef606cb9313c4808595a068a3a1065098 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc71e380cc176a5e9445ca2ae660bd288de1ad15d139b88b846c5eca7c2f16cf +size 11395