diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e3093b36dd3cc329afe9582b8fc26c0e74031f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f95b839fee2461681004d4a5425253fc4ff47b95b8728feebdd38d4a49b208f +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..885c581af6c446b8530e012f919c7bef466729ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63103a712b785b68d04d81ddd09dfd3950a82aec88ff52cca41016c08188b59 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af74aec94817981985caf2104994ae43b0fee5ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956370cea0f91226bc84904e504d8609ff637129b937a5f53190b06529edba4d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff8c2ca409ebd43b34397e80dae332a4e0fa5c07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd02b1fcddd2f1dfbccebdc1bf364400c833424a3c1b824c5a3157c225b60a42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e59bd616dd03a18c71a71fe1071f0fcf0ed36f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71238ce45c255fa153235b69f46f8d1380eac0d10df772b1c2c842f64b6c7a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..491260e201202cb87046fd8e18659bf7683a2237 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2639a735e455357c2df97ee6a84dacf6e37414affec51b515cc29e52a4f333 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3418ec6b29dd32c4b4c86c957a8c9224ad07d2c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce0bab5363ad9e6c8a02794e29c812c97bbe019f6a56f88bacf072f2dd33c34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c211b75126ac333f0277044c0df84d59038b42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f32baec6b49451c0c3df83dbbc1fa608bb7cd1fb34709b247803614aebed8a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee0235771f448bbda419a8518aa9b4188667129 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70605bb924d388c3d660f31c40382c7dfb4f0efe2fbc64823c84c75dc3e608ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f071fa45a7e11ef3143e02b0473c26b69489c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa86cb9e0541c3a9b6f0cd2007a825dc265d31f69a055fc00ae92017b4a2818 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66940319aaba1d91f4335d77d1b18e7d2b4fd2fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a7be0355f44cf0bf11734e613727503594e69f690ec6b9b07d2a218ae07b19 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57c956c9b649c8626c59b324270a99cfc2627cf0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5afba05abbd249e1019569d6ed8cc9fb9a35d3acc1ca94d39ef2c18d25d6c45f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81f0d37743994e860b9fc0dc3bc3332db2cc61ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc2ff35abb95abc24e153af8a5f94b6c5620709d27c3772814db9e5cceab56d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4721fc5d2ca4055c90de30418e5c68e4e392907 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9651a39c40369cca2e984a73f3bba58730427fe66187bbec7d8d510d5e9b024 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6911c5822e484a8045c0190b61fce84806caad37 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f2134b2592e6fed5d8f55fa7b5c7f861035b9587f71807ba7e79258d816214 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..185f14e2a2ca0c2909f213a2c7d04e6b90a68826 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde7646667b7744752a569b72c205b352551bba0b9629c17a601defdb25e3508 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e13f42f01fac99eea4d68644f3ecbd7fc1b50cca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015c905c3299b369d4d797a38caf6b576fdf8ed304a88cdb39633bdc4d700953 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4773065fc21fa942bbd247edb317adb636001ba8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2abb234e5ff2a76b0b4d41d1df62c6c1ea738072dec452d1462d455b1e4b5036 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1075b55ed2a6495c3f4f127594552d24f882f9ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5fd0f818be8d34d076faeb3214fe309a2b2499e636a8041161bfb082a4b065 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..425b801e5bc8ef1d9fbf484f2bcf4275c5ec94e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dceb4c9d2727f470afa43543ba852c1a0c410aeb17d86bb412b7934011450b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f6d2d894e10ca0b3fd5f96414a1bc157625b70 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca13ad82c2b26ac32efe094611dac76dc1bbc9e5e239174a86e918d9511f281 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c13e66d81882c0a3691efb547074f9c29094fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b57f70e225ae867992f4cec71851f39a1ef2d8000c7ba428b59e6f3a1b65d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d29b5ccb27bae4bd58c3fb8fb15634b50660c328 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4475868226db04e6102d0d4591b97bb21a9b6ed2246766d62ac26aa4ad1409 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b788ff8d24a3977108fe0aee57551f108d715671 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5892ff9e93877ff1faae88b9f7aaa33f6e928a13440db6877ba01e74857b342 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19edaca1c6ab52354664bcd5f2cdb1a73e5e43bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae7f4d3eee2bd311124de09012dbc01833536cb34a0e74585fc860747de6fcf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a68323e7a20dea8c8ca398e2676c9a90015e75f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec84466b69dc4fe2fdbe82b22b791295fd7bdbe0cc33d4de662bf451dd0619b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aabc175e3910d177b5000662215dc72f98398895 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db91b05a135674ef5e02d666b1f06bd2502e0488d4b5f5286c2975615caee8c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c07b51ae6dee1fbd1bc361d0b9035f3eef6b2e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549c7bbc9e601238e6fd2444aad3fc5de192c3c113d4c327b3329e3de505cf44 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89829873d850dfc970774fd488874292c4e1864e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb2a6fc2da4bc71d6e56259d815209106c3fd510dc6dc905771941bb828ae64 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a6a64d06908dedb1ae270f1e7a4f494b3754de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4eba82cf707a37157fa5cd929449dcd111ffa351004d4ed26a8df122168c866 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04138e64c853115cf6df41b795a04a146c5cb92e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e2f2c7a3a49bb9f6ada2432da8b855dd19dee7175db769efb62e3ac3b9f59a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca4792d156469968e24fa9cf9c4e46e242722e17 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5746d31246c875ffe5134774219a3df410b224b6ad42a0e8e69b1993b81290 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..795efb85f1bacbd09e8611d8978dbacc3646edcf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2b507a6da813bfecb19c259385ee67c4c19645c12973aab27d47d5e25edf0d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b52882e744a25f3461f58963b3a214befdc34c9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d08510706c016f54d7e76a26d179c4cb4d6b6ff002272c2cdd127f3577bf8c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df010d629aab578fdb847d252dda84f95e8196e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729a84e54b4917c036c5f96f6c375d67cb47860dece09959c84c80c40ac3f006 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a9858185916b29004518e28e36aa246fb5ea49 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71595d099ee767841fb35e8a1d987100326578bdac471067b0637d5ee4f4591 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9addff893eae331800d3d2d0db665cb5edb38b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324fd7fe46889de7b361fa5fa3d44cbeeeafcfbac47993acf73e717d917ac863 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401bcb9a8119fab9f3277e29081bbfd300f405b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718df8030ccee14db3b2fd8379a35c730fbece230aad3812af38c9d4e159d60e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c458cc104ceb313ab59a4988a68292eacf9937f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f64b8d38e03725e28bf964bc7c72930d0061c6a54c1fce1f3855f56880235e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c91b5367a67fe59fe673c67375912017e19e3b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc0328f4af65d64f75226c25c535fbeef4b644b96041eeb60fb4eef5c10fc55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5d457b7fae6a55030e7da6822eecfad25b12c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e248322decd157d69553548a2e01dd01ae2be02708d3eeebdcbaf2cf18d20f1e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4865d074ca5ad8eae14344cad9f989608846cf6d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4bbeb4f054ea48f7d3cdf0bfc57d57fb70dda4b2d5b23ec9e1019565eaf61aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e605fd18c159040edcb28d907644c838293959 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbdb282ae519f482ec0d9b564d93bbc43964a436464f9bb0897d8f63bbf44aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e379a0948843a7a72a97db3a792f1ca57e62d2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075daaa7d6901e3cebbbb497033362bcaa5ede4a0e1de90dbd758a294430b2cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..677bbef2ef8d27953e0179bc4eb67ec42bdfefc3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af54e4664be52d9b7b96e02b92da7638d5c77a5708013b5d41713b5a72bd2361 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcf396a48e1a702da714a4461c11b7b55af4e160 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3014ccf679fbaa8b0e1ba5ce4d87b91bfd22e0668f992af35a327189e07289d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5923c4977bb5d4ec939bda992db8273060c7a973 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca01aeccf834311345c351009a256b0a6aad2b48d7c5278861554015637ccf99 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc5007bbfbac3ba35fa90d9a2bbd100e48e61b7f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aeae874d682ee41aab5fad12499a2e0902a330e686a9b083ce63bd5692991c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fefc36ec92a7ae08b4c3224aa67df4436e8cd13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d21b4fa9a0ad770f8f5a8c763e4497f5d07c317dbf9d63d1d90698dd2eb3af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d275db685ec574bbc9a34870811add8671368488 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d794c61c54be0cb42da3b6365a20452bfd68e40de68ba1c7c4665e8b45af122 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ea3bc730f1ddd59294dab3c6d073843a25af97 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fef88c83d62e7d8bfc44a90e31cb523579f2c118cb9eb497d0f20736ff7ea67 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..093f628e30ff1b4e754f2fc13bdc49cbc99ddf30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd2ff998cf6e132c5ad12e750dcd88defdc6773cb9c092ddfc920f8ba624644 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01535aa37425db5bcb75cddc428f8d8d2c89b06 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:864d0a80e3dcb87bce58f20dc2dbb8918234edbe630322b753c2274cbe78b127 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1988d7de3716e0ef18cee141d8bb27c652702a12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78a5e25677c22a0552967cc80dc1b8f9eed5dab1ccc31a2717027cfe14eb86ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a360f05f17a7bf82a2eddbef9a37a3c9b91d474d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb5382a7a06c03d060b0cd16fd1be2bf91ff4e112ad192adbe574ec6b0c6379 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74cc6337e0311ed902d2a20a977d199cb1dfdc17 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3e586cfd1983f9ebc83e0b38b0840be7ee3d396ac50f2846083313719bd0e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72fd0dbee5fe979f29dabc92e861e339a3aabc0f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2bc3e7046cfe7e32ff66e691c07350be122d43b8c19948d5d90df81398ccbb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d58199b0bd2e5cad51a348a08df395f2f39048 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23629976b6aa6a92e85f0e0c3b6ff8996edbba6b5eb4500175dd1ffc5a4f1641 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43ecc2693186ab83e405d8d60d44d4db91d5ada --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c75a4c89e39156e3cc9c773fc4143feb5862d346ab2e59cebea8e5fbec52c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2799687b5405e44ab79c36503410d12033b2985 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6596cd89be4312c5c436f7361d3e69021640bdf692cfabfb4e422a7511acb31a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a39fe5ac7495c7484a434bd8234ca6cd5b15e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e1f9f853ea728ed9db15190d8750ec63648e9c6ce2df4d901af57d8d04177b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e353de60fcb8372c44b094324e397df549c18b02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3354b8665301a8ebf0d4be99374ec14cd21c9fa656783b0e0ee04930e03103ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edee42bfebc931ef98fa62f347242762fa5abdd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ead6520fda3a2fe37760c5c4213278f5bbd85967075fdcbcadd0060161f8038 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a47b3fe05252f4a004ad139c86e352722868269c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b75a6a34a357aabf1dde1108761ada5167623f757964d53b4f25f6c7ec70516 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c141255d26e50d5124d064e7282ed4dfe2a5a121 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1239920e040806538442f5ea31bd74b7ab20c2d53b0a04c1f64c2de514af6c3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7ba2ab12b69686260f2b79f7b34bc0d280410f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f3ae083872c2b959387d6aafb6c8c04c1935c4242c3dcbe90d454ad0cb9c03 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2512d7518de565cc07e556b1cff3fe963373a8df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978f3a49f6d0fa95aa60af3e09a5950508f285b3b790cd82629ed7efa883d3da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7afb7d6ed44b518bab2cbb7617252efbf63bbddd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:230ab69cd58816b1620518b3e10220a6ed7b5d034ee39101448a33f828de6706 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2483171b55d2b42ba66efa33995b72afedd71ebb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3419b1cf2d2f1f5c47f202b4189e955dbd1424b667c5a37996a5471d13a4a4b3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10209892cfedb710e61373ef749ba9c4a5104b24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00bbbc1ea9b8004889483249b823cd6055c29f9fe0df0b59c7322341aa1150e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5758edbe33f852084b1ee5028ae9c0ae8a47b2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac085a8775e40b95b09a96bbe7fe91f6072bf8f694956d0691f5477dd31fd6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a8d148327f055c1294ceb90a437a284ec35e1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99af39b27325656ae9c5b6392baf60ab2a4749defd65113bcf067f63e7872d44 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8e55bd8bab3f8b780050086b9783f15b2a32a5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c730982aa479034c94d5608a4f4641d9ed35fe335ecbc10270b5e2296d4141e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ddbb7cb983473bb9bb1c5e8ae79fa89ab8365b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899e8c354f11535ad70c0d5585d7a565c9f5057d17285b5ceeb7aaedabb87841 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57c7c39c7af0144e88c379e6b62205c554f3647a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41be56bf4e04f3132bc5db86fff3294000681ab96e48c3d948aa2fb64232272c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f64538098cc2774fc70550a7825a2817497907 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c034d53275f8b77292b2de57dc8c91573d0a0bcf0caa75b2b56a1ba1e4bbb110 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88ead6649b62a8fe2e5e304abefb9c2f16f2bd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d37a27f73b3fc6d655b3660438730492f6b9e59c94c04dfc1a79a1d72db918 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a11467a025b3f703779fb80ca7e8acf8449c6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23fddb79bf522241a3b812ccc67d852c4a8a17dd19f049c4c1300a310caace32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb2376177eb0d570d1472282d75b18ff48a96dd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c1c40c07a05ec05a31fa82ee339a207dacb8aceb345dfa9e6c9c0d29ea8ce6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8564b180dc94ce9f431e2f00687b03f175412779 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cde4fb50dade263aff919c638ed43b6194ba8c79dcf938959e84b2622bc007 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7a4478bc8796219527d2cbf52b59f56aa1e2ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5036bb77ce87be1d80f98905d0e08893d901b6e0809a7a3e98426f97ea18669 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a90b4c3950672eb8015b6f5bc7dc4e507560674 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68aa7bfb60f5f9292e7d18a363737b4d74c26f0ec5c29a6ba3feb2b738b7eae6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c4e60ec3df26e414a948dd33889540079c4a91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3308bd2f7b34d1ef6a36f62ec7e189633c25fed1a352c6767fa3ab2836a1cad7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1033dc3ea6c848b9652ddff1d2112728e1e9b554 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9217ecced9ec2b51048131091f4dd054408730eb1848214e7e5e8f306ad9b223 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ded88533a4c4bb0fd2ca517c6deda089e0a279f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad38707fd31d1da44ae13bd9536afe404a3eab95f8c7e0202bfbb3f69df381a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e44e583730868631d3044a6a450e23f8494b877 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7b66a40f9bc56cf06e46997b623692fc6cdc44a4fafab13889280d2edac802 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b196f7e00e2934472eabcccc1364bfbbecec2f19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1f3b2a8d776738bd2893dffba0014d5b268a8d211aa11e07d04adcb50c92f42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceca113e33e56940866e717bb280a4d749b58e1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdbdfbf44b4c1458b80154a65c7872b622a1e15dd53db178c7e9f9c8869b2c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4b7e37264def5fe81268bee056985ade786878 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37080a051b594c4c2f6b4b7852b79083a49470bac627434e98ecfc77311ce74 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..071fefde0799627aa05cd0513623b450d82be014 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83476e473b0991be6257ac431707c79369ae9cb84c1cb26da5e6e5f82d3c863d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b5106676b3e3d1d429b5695a07699515b39a1cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24ec672648e4beb585715ae4b749b81936d336213773893103fbafc41d77a965 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3472d9d28a4ace2e57fb53a5af884fd27f8034a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f20320000011b01ee8a633ffde8435cb938bd1a73e731b37b5f48d47d30a5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dea75cc90fa66de70f14d582bb8ce33bf777573 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24bc41d30123ad320372f55a513d876c2fd4d578a68f6e908296d955f33dd4a3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f257b6f6e8457cc87be0263a66cf9e1b1ceb6017 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2029fa1796d41c879f12fd89dea9e721b0695c01058090d6e5952182f7fba3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2895c1f21ba549a4ff95c857449232bdabc48dad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee233db44fe856e5bff6f868bfd00f5c67ad94ebf783268a03d1233c2cd0d463 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4d6263912bd99ba0e568ba3322412a36aba8eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d05595b37f737789ac4997273b060489bbe6d39b0d509c640a96e76e49da006 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c260cef3205326889ee908b1aaa29803cabe3e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fd623185b03c60795b051378f94454d23618dd06efeffd505fa5e0688d902f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..313ffec8976e6231110e22aec7ee61d42fd141e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446c5ab19a00b04a0ddcf8f0510ef155bdf86b4fb296fda2da8d57f80aaec917 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec63db2792a83af00c12c8c0a0c6619747b4f616 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b331b7eebf970236fc72918dccd845f53d80853a40e3edefcb5ab0d94a36df8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..511e6eb4977c92382c8fd53d7dc68ea65882e41c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27acbd673debda76bf728c6e68c0a2b9e3bde9a4e9e4fa641761f47a7015487a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f36b43d877b777d11f33e7a22b3fedfa625849c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5d5a624ac762ee5269dbd30c635783ee6eeb060dda9aac7551b553318f446d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..682381d46b75194620f31923bac46ef224cc623c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a1e84bafc4610b6b33404d9af5e461efeb1cfad312f8b679ef7ab7a89dd3ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ae391675db1f1aa1df15367e19cd7aacd8bc0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603aa6c71bdf32ce5a9805b9e22a7c1541dc6ab7d6b9f6439a09c8f19c4a8641 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2634bd29ca1a0c416a734361838d86a22603941c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e8cc143b0c2da845e4ae525ad610893d5249686f762cbd2f968d8d97cdc8f5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07aca0370009370f06229a333296d7a75e69a411 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ffe272d96312fd9aee8dfbecd59733dd6b2456ac7fa6e190c0ce8ec995eb8f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f32e839b4abea163bce4819e0e2729e869e63e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00f4ad49ec4fd46ac896a9b591617645ac193a779aa8b6c7c080fe36c463bed3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c053ac70b32dbffff163925f79aec341a5e2837 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fe455d72029315996fcf6b510e6edbbf16a386ba88aed58c91b7613958723a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0480d6b6db49a821c5489ed66537223c76a81172 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d85cdef84b8bb444f4e23b89af3489865318b8ca1c1afd2f65a925a32ec1fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76865747175facdb2953dc21ca599c7c452c5f32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6682c130d4c1f3bd0d93195f938b9df0b76623c63e377fc82ad9813473ac62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..952fcf3de30afe66c3557c64041d68c92f28fe3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed9f7d7c2ba7cd8382030ca472f2705f440d9a266bff5e0a180c66b0e68a36b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..891f374435c69bc8c65dd75371a40a70c2022955 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5556cfb9c62a0147c7cdc172f699e5508be8ea5732c9163c154d38efef6d0a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a29d8c8e2f6a0f95f5aabb73145c096d36333d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af6ee43c001cea574cef0480f244e42757ecacfa93dc01cab3f9df9ce418dd3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14441b494b5830e2dd0ddb5a3faae12c7557648c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40709b52b885da7e665bc44b03da810c507d5f987c908a73d9b24469e9b3baf7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ebf5e201cb1e0bbb22efcc28f5b4578d439dfc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6c01d820169cc743f8283b9cdc521c32a11452ca0fa828ba8f7afb994435a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..398e5b51ee2ed20d5bcc6eafa09930bc3fc48005 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7274f3cc03f253ba2b35a834fc33d80c6ef6d656213afbc11a4666b28aacceaa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a708b7bb688b3b4e33f45df840ee1024bb57f3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195467425d7d7248337b598cd6d0c0e39e0d779932d0ca3f36281769e391e582 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a524a2c3c8f4ee8526695cf246fed119f11bbf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7065688ff494989a8a7ea75a064a37510ebbcb00b5bb0ee3aff1bf8d9f26c9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..339e67044cf89f0b7d50eab31a375eebe93ce441 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5afad2d48ac50615b08454f6da72d2056f251bbf1709e27a4f246b6170872a45 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1718eece427ad59c8b89c908a8e48ed1c6b84bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8716896d0efda7b00cb0401f15f235bc550d45b0708b00daecebe768bc6b48ce +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0e2cbfb48232fb8fe8b7507f40671cd5b35e5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ce4608b080b2bdc053b13bd7a27522fb3e26254844106e8b28a682f2c21c79 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58a1666a762fc7a9bbac42216853c826242d415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ef2296e1f5d25319b4510d8b2cf25b25209ae0efc95226c2ad84ac2ea9dc27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd406e76fc7f429ffbb7529b325f285f22f5a01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4686ee4055ba9cdd8b87e50115ca37dfa0ca9e47c57b8fe082e83fa0814fd6f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff22e8eef2edcbd5784a006ebbcb3278a953b3d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdb0b206a89c52757b3e060e9b681a975f817b61f6503b9d668afd63421a019 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..641f63f0d38e9ae5becac2a3fd5addb0ada9250e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1713cc24bdf0d02105c8b2ca52bf2d429800676488c1342027bc52c8c16ec40e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f11a43fe25c6e0888eb275667f30a2b5c2fdb5b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e055864fe2dd4417a8550ecbd248f12785b6810ece15ce8149cb3b43ce08e207 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dfa0b0c9e2cca0725c6e7670e152457808d4ad5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36798c8d51f778de7b4da26bc7d5c42e4916d9f53e73993cc403c74843dc57d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba5babad91988a3c5aaffd4fe9c0cccfea0a389 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a30846559e63753a1f18b435f20191cbb917ee6a912f44ce788b2a779e3819 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c89c8de8e3130f56d3db4c33e5270e78dd297570 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7881d2125af918605755021cd6304f14f4dd15f0c0e224516b4ef06b6811921c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bb64d8ba6407ac4be9c7649ee968c4309299558 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c419a4809bd5af3debb642d762f2cc9241804808edbb2a76c85d9fca11b796b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fa97b82d966bb038488f4169cdf12a6b66c8479 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c7f4a2d58e03ae38fa74c38ab2af32bf8a486874a48e88552f4551577bafa50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c936c018b0c4afcd926bdfe962cabd1158d905f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c87b9d7c83cf80d62ac817773d5c70d4d7925bcf043ce288da259234bf85a44 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8358087ab7feaf126205a9590ce8407c29c4172 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca3d50f3c5729554ed31424214d997785a5e871591fa6fbc88310fdedd3bb49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c812d6269da7a338705fc6868a2d7cf373bfe383 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10b26eb203085b8362f3b5be36579ecc422c481784b12435e85f9e021413b34 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f2ee933b45e1551054da9ebd555160237c57d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ef51427ca57e453deba408a3cf703fbada75473c77c3f481ab90a80ae60dd4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dafbcbf27ffb35c99f3f9f97355d95fb55a5090 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c816daf3416f7407de115a048e14f1f275d0c3bf65f7bd81ac7798733c7116 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e9d7f924387a4b77e3994740e7b868cdffc8a3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5c8440a07e478eb7c9d7350c3fb9c12697eb2da8c4bcb90dcfeac7ff845e3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfa98d7aa2bda7dd0947ec55ed6961c82d00f9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd94fddfe5a8cb6cfddbeed7ce7e64d991ed5c576dabae0561d5839b1c7e59e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a9339a1209dfa34e246f06bdc8eb81fa2e32fb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b3d1e77e3fc5cee495c8f17f45bd2d6d11ad39d165b9935bbc572cfd688aca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52eb3b9ba146f5678d63bca4194d1ff19a2d3ac9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a77296e39f1b786528f1a93d346fb7bb939baa7a256e680d2059d9911ef295de +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d5feb1878e998bb841883b773190c1a5869da2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a364a929a824817df7754770b7bc871c87f6f7e4bcdf4bdef8e7787b106ae4c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ddbc6b03f7f7a2ec67e87a29013c840a85aab56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a65f95cd66b875a78ceccf92205924841f25fab78ef0d18986a98042ef65953f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f32bbd00b06e83983e768041e8217bf0fbe5e8af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58337facd80366e71575775c2260820f9f2809811e473618bd0cb38f29dc6bfc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ab5715d571bf674d4cda19fbf760f928903579d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad22e4fb62d1dd7526adc72a0623224b51f52ab7684e49d56639e916b794b3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a968b1bfca9fa228211f773cd8dee72c772cf524 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0fe4a3f218a8ef2f0265ab2d1f119e444462478b976dc5d55bc0d5aa764e194 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da0063338fd8fd0f95eaa7cc6573678e5e10cb5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444a985dad0c0d676181204389019176be9cf2e10d1b059fb42a0fda07f41316 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b137df8d23382dd546fdcdb8de7e5c06d79b33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498c0c7f2ce19b19bd35dfcd85c884e07cd50a01359ad2bdc4148828c052af5d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd6ca632ecce56be6766ca7558f29527343c5db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ff4a4ec2bc43497ac8887211dedcc22d26fccb5b6f61fbb3f61efe76313c34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d792445c6033e67a04cb9abd8283d167eb6ca204 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303edcb992b2dcc85a534c2dfdaa16d41cf9ad08367c14ab8b21c08e04b9f758 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41ea1ee5b6f121d4af3d3303c9177e71aad32c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560df9d28f762edf1c0c2ea4a9047fbeb91b16660d358becc09514dc0f094fba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4877195f6f6c979b588bf652f074417b0c95b49a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc364e0db19bdb573f33a3259a1d82eb362ab0b0e847bd7d4d9a3ebf44eb190 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d977026a79dfd82cb7401455b9df586e04a53005 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aabc7543a62f4c4a02ce6f41e35e38e4c2a0e0f45442c33ad81ab1ee9d6db94e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16105823309d93f8ba6d951d47f152cd70af35d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f576610840a7ebef5d7a78e61c937154bbcc192be2e5479fae824a5c7b8ad193 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52c56bc6f092be1d30a794d5bc2402f86a5b688d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16fd17a06883a1b1b32340975a1cede5c5ad8cac9ae7fdaf134598e526153746 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcdd52d2c77268d46fbf41e6679824ba2721d8da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:567489adf0d116513bc0824e70757591430535dac891546cf367dcd2ec116053 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c4917a6cb33ade942e46ac5263ce25fe23a415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75503084926be4150d53311ea232495092826b11df30e70b31d566330b42117a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80bc12cabd18861c9ccfe51d87177a82fd9c72af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52687f2fccd9b86c6527d8f85062ad9781db811133179da47bbdd08f5af21340 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bb22e795e815f0fa7bcee990807769053888f65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d938e1674c17ec489321aa18503dc5453b383524c903ae8aef70abf7324ecc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c99d2f5e5993fa7e34d917a250781aaef4e40c4f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3a678b3c208da026aa8a7a850acb0220564bcf278b32c0e4f6831ee03d56c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed7dfae1b3719ddfe9a9aebed95352fe4d974a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1625e65be39b64b153557da4649eec2b2765a465e235d189859d9034cb2d8344 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..899c8599daa48f5d06577129cc739b9c581c9b35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab0434755171bb511fd7cd1b717fb1fbf5db5e916c92646d76cb38b7b419201 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb8aabcbaef53b62af682ea6b43d029de159bfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f5f90d3f8d725f6d91b628de71b21a02233fe9a4879dc5e34f81bbeb7cb811 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c60da527827eb36d3f93e329193e4fbb95c6089 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852315214f4f7dc2acc4ba69af5d14b3f71d861c5b62e96043a0bee7d2c62a15 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c00b221f6a6a9dc67c7f1f3e5a6250b8048ac9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16097249a4a0f03227f4560a02098065c08bfc6146afdc5c74a1c00de0d3cc2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc7733df26fb0d8b87925005002f49601cf2a9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2955c37984758f7e99a9aaa6dd9fd6ecd2cf79bb7f121ae9536e74076d2b6e6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4168eef3ff9c3c18a4f1ec56707538fa4e7ae45 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986b472f029172f2360cadd2c5ac7703bde155277114786521ced96ddc88ff1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ad3aef061ae45e7baf475dedfd3012acb91207 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f515bce027b7e4dba72d7966c966aac8082eebc88e3d3e6abb1461bae7d813d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d0620069743869961f033ce9edd9e1c32f74e5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f65876b1af5f2a2682708741f3881134b10aeb452452506e39315bb5865a16d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9beda57acc746f703bc041273caa6649aff5a6dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08fbe1f4ea29fc0c30af45f72e8442422ad40736c1d89e46107a7aac2d6a6cf3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..663b5ae254578237a67e9aeb59f0fb2ddc4380f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d0526c65c48e3442636cf62c9ab91c6270939d5d024d70f4e8e643c12a2875 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f990602b0d94f3d3a483557109988221112cb31d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e72c14c7172b1107b3ae1edd203114de06a5376de146a3315598c10ba9e190 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf195c8337b1ca3089c719968684639ab4aff628 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0732a0f79609aaa166a9b14e0657e0f3e19cc98f3c0637f2f2d75beffbcfb26 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c2b91f6f22986b67b30725aefe8a03b68e7fdb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b709658dafd447545f49f293ca26b709bc62beca4e4aa5737d4b6459df189fad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62794cec51516d86d1134984208ac57e1970d99 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af4f3107253578141894868e8a990cc024897ad06db7ffe8d2c620c4b4325f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd08b4827bc0d514da6e4cfb6a2a3f04e03cbe99 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0354519694fb99008709f6da96569235fa0e1e4b8330398924dafa0567da28a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6aeb2c75875b7a83072fd5d70273f85f4739233 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7e26c638af36a64bc00e2d20a0df21ed327065aab6e23829725e04313aa031 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f0a24dcfa499d3c2b046de9e43d6b3977b206bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:521c2c5a7c90bd126f9f361036d72c1cb193e5619653d4dccc381cc54a0cacdd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96f9eff52af18f2fb99acc652c88516730d47b3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21c62c0c9ea5a8fef0f20eb227423e32882fc8cf79a8c2692e0044f2c05246a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a1931bf6a7d8804cab70e310796c31b4caf9e74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa1f68f88160b38d29e8e045f0a3bd9bca11d9dc356f8b2f1c46790bbc4c36d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..599681223f53d49b483f02c0deb7227fc433e4e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c52782fc845d4bb7b78f3c7aac7fc3a761b8e9f764fca92105d612cfdc8ed62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..176c44d515e60f7a045da21db83772390e111bfa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb70281cef5ed60f4c8587c8d648022b916641a80a2cbca42bc81ccf3ddcf88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56c56a1e511e2e5a8929f3812899e6c67809d889 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e584715e68b94aedfa1ae7ab7a696397845cca530e3161b48061419bfa5dfb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c52e4c0d95c2c5cf7935faf9fb815c946163fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332f645f396c97a182eaa27d31dc74fb74b282af8371b156ee90707fd65f58f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..225b36649c7bdeed3b9da9819a9e80d99bbe08d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc6d9f89f321c9161228207aa1b0b47613d8883b5f2ff1d791c1b91d762c9fe +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf338d541cd47226e9e022147657b25afcc1b253 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9264118619b5930db25d7df4ea7001c997ef0e64a03f5e43a7f31456835718bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6a010735d346092a552db8750a3f518a393845f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b04766faf0f85bc9d2e71b6641bd3472ebfc62578f85ac414f60bdd5ac02183 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3111a22d8f62cba0136370037353f52c529e507 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a37e2d9efa60563954debe2b13d33817b9e6c3f2fd7ecbbcef759f6f6b981d17 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..783384c18021e5098071710eae9be7f5436fb033 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38aa3867767418afc86a093c221b5533d01fe55c3174025384112a554ea7a34e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..937036bdead72a18c1aa12651bb1da2cc62de3fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4ce83b526900e0797beae79a70c71dc723a9870ccf9807d6b219671867340c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34f2b8bc229cdd98c1e9f5d7e8e468dc58bc44de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd8dcaabfaf90dcd570dd2a4d26f99985c301c28ce147e5f2209542883054f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f124736e0b6abb86dcebcd90f1784564c73cd52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a6f077208c91728c9a0c4b5069cffba7949dde65e5941dc528fbb60bfbebf1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a59e029669b4a18c3769386a368fc57f828aa8ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1f4d8ae8b89a53fb6a1ab507303bab2348cd694afbcb64ae6d6e37a9568a38 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab36a655c02cc24662794126be55f13464cdc4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693521af2c1b1eb166f79ab7334bf05fd53ffc6cbbf8e89a388cb31a676621f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f0276a827a45af32d77bc5065a316ddb0afc164 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4864bb76179ce8bd7e66c4ae8c2741771abd0297022718eda5ff6d208b16743a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c617f79bf66b18a132ad7accf49ef4690a9415f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88ad1f44bac7ec5fd41150e4efcac39f25e5e3ce0a7b8e64dd530a048bf332c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d90fdcc56cc3eba6dc57e5d83ebec49b54b9f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b81a35fa46259e193dfc29e4bbb6e29f1ab06671d681ec785cfb1f1d3cda4fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e7a826b9574b8719353365d6e5236ec81f95d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93a7a258ef45496503198a88b8ade1a7168fd2b5090eb87c8f938aa72ba3338 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b032486574e39e7759896e61e32ca32be15afdd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64641c095321cf2a48baa8ac0b4a87f7c8be6bc99a923560102c029dcbb30637 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b6c209ac69a17c89c3d548f5b71a355dede6212 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac9ca61ed11569278155571590586441ebe2fd60e81ce44f65a6a349b7a5e0d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6709b8f13556271e77df51ce2b4bd9d9950e46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6a47c6627d73a742750d8fdeb1b65ade781f1de72818318610fbf728724f94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b8c90321a246591fa2b8e75ff5e0f94053f90e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d07ca761cdf480e3d411f487dd9bebec537deb355306af7d5b68e115e22bf9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbba01f51b44d91945459feb559c82ac1ea05d42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0bf0305c66fd61056ee65f12cf7ddba4f960cb74febf2faecc052febbdeb088 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d1bf7c2f4c1c272c20849e3f60d703ab97e8ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc55563eaee0fd0ab298d749d35a8cd90293897befafad3cbda49e2c117f56f5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd53e180b66d777c11ee612909f1785d7903c33e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aae6cbf90fb2cd20996a78de6ffb261fd028d882b80dda702572e425102b4d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc69b9f3a354170cd7e169202ca1bf04c848225f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fafe82f0e5b41670cfed94d376472bc81c1ec1d570069d388125df86c001048a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09941b71c3c045faa7a33e5cad5cd50dcb0b681b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f1ba29e971e8e95c4a548eb105c2b1e77d4340fca7a119082730de31e7300d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1280a9db50b666d66109085e9bafcdb09360786 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58f81c67e0c768eccd5f5a3222134a6b6ea0937def509daf5331c2eff182964 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b102a249929dc21470f9d82160789d1cf4f30e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca91f417d329ae7a68ebaadb3491e770f2f93c36bf7b9ee72481093e8e934357 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c1845b64bf90f135a661333803fed7af094bc88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca3a67886c6eb36a613db578cee71e81c0b7712299f046843142f3df7e87ef1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93fb5bf6e1b8bee80d0fb3cb6a00619a1e165ef4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aae05f346f72fad201fd0e6084652f46b57e88baacc7c838ef6a5e14a6421faf +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa5b855ed61e0bae291f5b58a1a436ce44a92636 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f01025d9c521a6d2e861c3abf7da1214b03bb93bfbafa83f97e6d7e4824a778c +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9fc3aefdee38543d90e5d6e5a8716e782bd278 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6561d73ff162a6983c0f3e13962e7da2834f96f27ad899d2ede30bbc6b5442 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b333119e46248ca2e71ba846bb00fbd76f9f5acc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9085e5995f209b4b250075fd81e69cbe7a1c04dfef6c6cb4bacd2952cd586bd9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e7c3addfbefab9603996d20c6f80caedc0c14f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4f97e94b9ecddbf9215503998669af4034ec56c852027fa12a3228e7ec7655 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01ef47dcdacfbcb14c111e7ef9446faaad065079 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e38531149202681939c2a0363ea3bb570a872708112deaa3149d554b56106f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dba4ce786b6db036d86027bfd88db97f2ade722 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7ccf51ba5232526f2b244ade551459a531b8949954600f9293ba3d6132e484 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c055eef6f84c3ab3297c4d2978568ed1134de61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1fe2fb4631b4410bda1ad19af0632e103eb20ecaf13928c61dcccb2186ad109 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54163107221392b4008074c9593607049baac73f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b095d66a2634e05845958fe70c950dab4c8cc535c636f941727c6cc1404f5d4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d21eb659f24ca366cc96935d503178b215331840 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269448e35c0407fdbc3996284d007f104c847d28c609cdbdc2e67f7a02725990 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbe9a2099856f2ef03986d6b6201bd5b1d5034f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab06ae401782b92af28ac493cdff72f1e54d0ec22f0d99e1e26f80ef5c57fc94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62d356d767d7fa6825caddcbc19625c86284a7e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821de2911807bb472b5fcccd86869f63f724628a612c14a85adb5078d3d94398 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0de6ef62d7970767d8e8bfcc9c3bfb4c5d319136 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ad556459cfb146e316c6286aa87faa5db2247dcba57ede35b54b0e843444f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed51b9aa3ad386c5cda0403bd7b925ee24b1e5fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf5b885406167911f8bc443e44c0d2a3a7acc6955503ba4dacd684057287ee3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f2d1bbdb0c9cfb6112c9066582833443233a43 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b349d451ce04122b03e41f89d557b25f7572339a22adfd977bbda0db62ee4631 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83bb5769e691917054e7c1224a8473d88fc8c2b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52e15a7ac7374b9be57752e8ae25695ef66e700b275273f9f510ce26e024be7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28432ebc4538c50325bec33674e3492cf2398bee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffb1d377aec3d227eaa305a83da9b80e3b2538b62595faf5de23ec6d4e0c9e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f687c37085cc7bb7641c5c32900ab1d0fe6a0fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3d080f747828dba535b88f9d16df026b76e63ec093e865222c4cab3196a12f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf0ecafa35bef1873887156e7fe8ab6ca2c8a07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12e542569873c0624b38c6eeb64574745f4a455f20dcaf3db27681f62ed3eec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..737a86fce5b0f323325ffdea5b757ad6ede614da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84724d271f69248dd8b029ef42fb7553d585810e26b8bd9f87301b99b0ca3682 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..411d072f15c0b00c67a2c8f7f5fd55d2bcf2f1d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc71400a665853b52d73cb629eb6949ddfa3557b023d0781c0af481e8710d94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c62f617a9bf17520c8f1583c66f44687178115 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc8fc535cd5c446cee490926bca0f7f0510bcdb702682b56031d7ff17bbf57d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..057bfa8e7da0e024ae6a983ca3472ffb9f398e60 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3dfad5faf29a66321febd0fb5e08e76b3234ae89a96b3b38b39ab6012a3fcaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f662864c34c0281f88056cddf1b1f1120300f78b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956b55bb392fc467e15d01f37fe0ec7d61a0a5eb6f875409a315ef3f9cf90df0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b4ad581ee9f81340ea69827cd0ce095f523531 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08ad7fe1cb0e961de1883155596e7a943e5d5db2996d7cdc76702fc18b21436 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9a4b766a7ab6038e6fb32e352457cb27c5630f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f69edb5f0d075ce53a9acaf3f3c7114ce76ec4c4924975254e23dfe7ef9b1c3b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..227d23df5e56a035c973e6479cb5a13b35510be7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7264b4b4213c66e92300b71d6e6220b4fa13782010e8548fa6bbca577849e7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fe1381cbe41b7272add18f158499f694e8defc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17dd81e1b9b0172e3e6904eb75452e52eec74c913d91188eab9443073a4b506c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95a8211af5090429606c4b44b9fe291a45bad74a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea77b1094a66f5f8393e22a209b3df50b8c31f88cee2e58f6b2080afa1e89f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3e6f6c2ad9e23d229dec501ed35bf63d65b6941 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b88ab14936d3172f489588b4a3165a75fa73ec30558aec59e925822aa69c88c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc3dfe6047fb15181adff6d77e219f5beaebb85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee08ad35afea6cdefbdfaec66ecaec51658a0e82b68b345630a822b6cf3ec9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7903cc3fb616570c40e8f07d7c5b50b3e13cde2c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d65f8d8ed99153dbbeec9bf14606b28c6d1fd0a179a0ecf598c44a0afe64418 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aa4df8c8813673934f8376a37e86ab385830748 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35daa5e3d37ff42aaac8d094149022c551b608b5d8a4eb37b75e186ec444ee09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..142a148bbe7d13ffd7d72fc7243404d85bfe779a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73434058abf20df15c0691900a82b839569dcfd48ad43143d82f002bb358ff97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68622e7d2f0c5fa335f2dfda5ff19be6992d7649 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71a9fa51af0bd8e440ca39c1e33368ec83a0e3dad63dfb1bffbb52c25bae68a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f6ac4bbc9c0c9387c15fb44bead1622e37062d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6150b598a637b2b515510ead3942704f8830f554a416432888d74bcc03d74e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e656884c5cf352945324ee2bf5fa61315742120 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ebd6daceadb9a8853f087b7f4657128f6ca7e7f0be500059ebd9b9fc139abb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef7607fcd4101a7f1c009fb805ae23fb05b4334 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08dbbd3ac0b6a31f114c7fda735d83a13a1c27ffb281c97b612429d0155fe07 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaa7a12a5d6561d2fa8d67991ac18f36621b2646 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e55809b387c9a13a2c5c3b83042655eb32c1e6d1d0726f16d95b864b7a52f1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47fd612809c016f822f48626095921c219a4c949 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1bf1f75400ef5294d2ad1dfc16b364067bc8d1afe29e572da87303360a57dd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a322efca77e35ba178bcf9279a123b910195c48c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b492f9e7beeea3c99880ec0ed635a4a885d84e3b0cdbf76b4e7cee717e8d1784 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0394cda96a4c623587c83092f306e91fe3816e62 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ef33bf25405b3ea24db2e28dc46bb5e0d94a55c22aaffaacd39d2e8fcf98ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc264cdd8e56f20beb8f31fe388f17f81a8ebb9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00292430109c4c44449f264dffdd929539c4f161240ae64483c52856a3276d5d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd02f28057dddad23920b22145d291baa53fa84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43857993a06a6aa6252e87b0323ec5a7f3ed4ff0e6204f045448de6cd5e2adc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9669d32555c2a00bc10bd990c185a919c3f6623 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136a0c583470b6fe1bfa0bff7581b80e8acfd65375f1886625003671bd54ad62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..743a6c2bf75f2ea5f5e3f264ed031a6c8245ef66 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:345768d04f6d1f0d8623526e3b0b3e7d0c00ba5695fad739a8ebbc229f81a40b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e53803af31571b685c056170dae923076dc6cab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5a9f04bfe62fe5ca566e43f45caf4fcd3ee750a1ab85e3c36c41d0d9070760 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25be1cddfde335107ccddbabd898b983f3e2d340 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4404327ed2500427a724a64b4fc4a1a67ea93538d83d3873a5b4a45e5b085d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31604e74a1cc38b4f5f0ebf46dc3ec3c3322f530 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c8caae90cdd2ba1e619ebcac26f4b1f5cde67af6bef52a437887b44969078b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ce52ca81c8c4f5d6a6ebb6ebf7ca3f6e4aa32f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5171a8b8da6aed1d28b2b71d7d359ddffe37b3d15d25b66ad3366bcedd8ca8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efd23f0e74df5ee279d2dacd68b86fc60b1c39ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb016d490c920a0442bb2adb742dd1296cfba699b8ea6e11ba13ccd4cbd2467b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f8310bbdb33480715fb8bab93c9a5a5a1ce93d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10db8cd4ed9b385f8422a360349403d66ba441d6f62db21f40049005be0178c0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf157ecc88095ed55d7522aff70ca6046c401a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fed4466dba6ac853f3fc3d269ebca71ac98ee8b492896915edc082dfa0cf5de7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..717501df88949c418d0da8e2d913c5ab5ddf00d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf06fadd1bf64dc0b61825b692209b8e0691925038b4cdfc11f346c12032d75 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d65d3e4fc790ded8bd2d2a8dfc74f58a7974179 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e009ceca25da95ec1e4bd1180c91482d25c1646d85050a24bec58e27243521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2699d0f1baed1bd07270580d4366cae97f33d37 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d24fda2104292885ec713422af2b93bc2c33b72e75f002ff35d51469cd38d5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaa8c68b8e3649466f5cbfc5e797f6f24b663e5f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ae09e1adb6835e63ca97119643f90447c9053dcb35b1e5c324db6baac413b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5976b6cdf0c5faa6fe781da71618f414081f1353 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91b76e51e0422f5c25aa1ba80915b28b4a97c2c48e837d0a4fcee970852f21f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c004c073fff966e1d104cc1d4f08d3a56d12b9ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95827e4c258ed14a2b7e8a389aef8886e32c4108ebe60f019adcef30f7c32095 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f168305afc0fc3da19f757968c6551e23b4174 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48abc38873ff44957bbf3a434d00e78946799bc43e4e0fe7a62dea6d6ce21ce4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f70ec40ca0d407fcbf94a3e5d1da36eabb59175 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2d4587625ce626338bb51914b611867a734231ad8034957247d2f81b8b8ee2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..116a99b84b1fe76bae5ba2b6ab3eb738c18e26a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b859bad1d2b4095f6f359dea3b63267f591486cb51342e636483210693cdf98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..414fbbe19dd02209b3f8b0c3ea14bb49d0f6abce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4ebf61d6e68fc643067f10c6af8f7dcfb2121463ca6398660a2ac78ac18a81 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ae3586f59890cf187aa36f30e7914fe7fa5d1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667df2a06383b26ad7b699fc6b9758c03962d23d671c76aacdd923648160754d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e017cfb08cd38547a99d21cddde7416ad7eca385 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2cbce7d0732d933e59deb3dd4edba744e027ff763c18c634e51a9e965c5f02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05add6f34febb106f38ec1e00f4c8ca8911ae5ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf9e183e2ffd8f9917feac484eff81392d19c55262bd2c6068c008a32553703 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbbac8b07cddb6045e847bec783bf9ad2ed8a35d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6138a3fc73733bc981e88cf031605b2f8f431c17ea1186938181113841ea03f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..039a485c7f669482738824580ea2b1c652266eee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb1efb570c36505bcb3227925b720d1e0ae45f6c37c53cdf8e39fb1506e7d4e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67fb2b9328f5d4f4f5b21a84586ad16c9cf11d4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4852705f2506fbb6b4a04be81598a19a09d0b19f628401eeb8124b5f9fd96007 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b53b9eea648e855bb1d0851da8b01b3904d74ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eca05c36b448872a974d6a7245f02f07601124a04a90d92a72656c323357fff1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21918e7e03ca193136e8feaf1a4b21e26e87315 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91173935972fc4f2f826d3be932cf8acf1d220bed6dd90c5afb1d665eccfdfb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3011af6472cec90fdc5c9bcb0a1ac8235669871b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f310de2f665b06a4818b998f8e054a4bd7316cf6aa6f597a64c486f03a3ef212 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d51591df21254d07b2e2801cfb398946913261a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c257195d8b11a0ac9e3578a6df8affb717cae854aebe5d96c5c81bce8dc5cc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b30c120dc68ccbe01fe4d26d0816b75407271717 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed8bddc385e1b82741a6d098d64d9f57d305b649bb58bc96be97c2e613df2cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1dec9574a83bfce32ed414c234b6448766a1c32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0700562f12d6bf464aad884090436aff2f0d9fac84d21883069de3b9916f4d84 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c92557df9c823a1741bbc2cfaade202abdf75e8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea36c7eab0db841a7af1f636a69e6d34935f364e255f7621a8e49526ed705ec +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e90053b198a7ebcc342f10d31fc7b50689f25173 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87705deb52f26a30fa7249fd8813793401b39df774282ceabb4a6654975898b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..550fdebbc0948a32edac921cb258bc3afa47f5ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71666635bdcc191c836f819f141ded32bf95ccd6931a3f529d1ccac2a91a9dee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4587bad243acf078dff71a6408dfc14c5bdd0f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1736c1d7a68cec025fb561e58ba6a7425545f83f9bc26a3b423e5be169bc3459 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d2479999da3c863938a806d8e90a68678d718b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b30cfe5acad409c9ac4f57230efcd8b5d7a3298b9c24b2f82bf00a312a49cac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f84df23f35eef3229fb44f259247734309b64bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47d791d93b73a40c46150339eecf76d825927a1bb7fb9a8d18ef4567fd34e47b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bde0a6a22bed94807beffd0b333a028f5ab6b01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a4d9fe61da6fab5debab4440a585cc90b8f5a88fd2635145b147fe5acc6d51f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85e3a02602a89207dadfee5ea1f0c940415dd3e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a819ebbe979bf18c3332a82db46bc8ad1c4682c640161708baf8d561567a1c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da64c732f9053b75fb6f0dd3f75f8d5260d8e43 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe0f887b8b52a772b4451b4767ee38c719518eef5771a9738f91951d888b59d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d250db084c2e0ad6b597bd3dbea764750be438d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2782471e2f40e61182bbb6043ca6c2120826ed0a586810e7cff46602108fbc3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56bbabe5f050b36ba749bf4717047835d10ea8b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e41454385eefa7b8d0baece582e7a549e2e711b73b49eb2c15fdce334acf54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da2225fa3bfbab06ca6490ff33b3a59d5417258 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0436c822839f6fc66a469ef9577c6b8573337227dd382bc993891d740c92df9c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa2d7614b7d6a9138f519dbc35ab36ca95af63d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9cd1541871762eff8b5130955bb81456878b14ae8c723cc66f35537cf38fa5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..866678235bda75dc1d871ed68e627808a54a9070 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74694a9c4401161a1df96462181f024e6ea75b4f787bdcd084a9f3f885d33dd6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8832cb4a4dfb8e74d173c2401e333c3e379cd9a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d26f6663e1bd87d3cb6ce80c24bdf1e13355c5128d421db920e5af16f0644a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8f1e90552f982ef2d3161bf3d059cef705ca083 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f260a2d8b7bea7634f39e08c0121fce35d95724d4db6f6616444a40499d0864b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55950121da9f0a77adeafd4b0d4c433f8c0efbf5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a02ad1a9c1b20fb8df0a55fcd28453ae1b74fdd4f1dd8f885d87c8ab33dd0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4f7f3cd7ae592ad8e492815a174fadd1659ccc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b695eb317b29311b40517c19f80a270a7da55361391f765f93baf9a36acdad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3d632e3457361bb7de4ce737dd6fd6aee96698 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c119fa076eaca26f9646dff086fafe734961002e5799b2ff5ecd084da18c65e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b08725174038c671c670fa444d0e158cf1cf68 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e7c728f00d388f6423c92d19fa783976949d9d11fb5a385623bf4d8fe8b394 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0579cfbc19363b397d7c3f978f0fb515031e163f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccb57803df8658fc3abbc7b21f44921dfdbded4b44fb484cc1a14714a87ea0f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..531bf7c6266bdf94abf7b7c0e861361535d9570e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89301a73f2eb02c938ee86abd5997063273d5c74223017e3251b5c6a8d4b1e6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..799fa9a7484728d8f0dc7e1debb1a532a2e813fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8680ac75429f590a4989fe0dbafc920bec048a0e64957f90ac906e8e208aa8e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbadafe691115466d58c70fe9f4623d03fb585b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3ebf3a7642ed8b2616200f17dd4c777538e34488a41119e7d3a078ac29cf3a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c2b57e615513905866d1f667c093ff51919a78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c455c99f180fe68a3c832e226257e25a3095671a1944eb62c7e20a0bd4530def +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ff06e0c15adb115c75c30360235237ad7796f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249175c80e2c656facafd1f9b953ee36b7d6736201e7f087f025ca619ecd319a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65ad15a1dfa7badfeb7cd137e0bdd9ddad67bad8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ffa4f5a8f1821f704acdd017dc8bb7b0be72b0d592cec9ccf76912a54ff588c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..232b03a51bd2cd4ce4b02703e988068c9a111703 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58cf8dc8712707f18106250c7a756a326852415f910c1b980ed86d54fb3ebde2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a229331c248cba01ec41eaebb2f818993907da1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3640f3dbfcc79cc2889ce9d10f7bac7f11b98577bd073d878088c4ed1d34530e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e3013397438bd3ed8623ca61453b50c5e18eca3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23785854702de715a5c885672c0ef24370c2a9f5268180f682ac19e8624aa32d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff2bb1c6d96dad90eff3764111d268a8cebdd69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c5661cfc8b8e17d793b590f913c3fee445225cf898253602e87a11221c13a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc7bbf1ac78583067a91b17e2f3dcfe177783d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a5e9edc60df72930c764fadcf3f0ee3d0b8970976b839f46653a0303921f93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..355cf89cfb8d76395c721e203140950e46d38f7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db33260c34951c79fad96deacff1e0ec12ef1d3db2b77621c118575fb934bccd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f26388c13ff2d595212192f8c01e71021dc9e81b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cda108a34a92edf5ec92542c63675fe59e441e2be5b23acf5c1ee23fdfb9a3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0278dfb3d589609adf3aaadc56e96235baa0f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06b7527446d4612795c8597e9eade4492232ef87ec745c955467170de5ece91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0636abfaad3d427be123192168e74961802ff22 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff321c73af2a90b501d61f2f4e10e2b6b96f3d9fefba95b18bc1e995cc77b96d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4608220d21606346bbe0769954f89051679a5749 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96853eb20051118ae7c8ec2acb68f139c3a92c01e2c8c60c63fc9a5c35b38ad7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d4c9fa404fab91d20e0796b92518231768b4da6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363b02df2c244bba84da3f8537c38a40652e410ade727d0f04c9efcad826e709 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a6848219ee95294ef6eb7aa2f8a123ac54bc48e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b8bc49de527c6edac7b36e4948ad662f6a0ba12f0c69b612003dd3c5ee30f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5293078918474e66226e27689128078d10ce9684 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bffc078be456264ea1fa75d419a8d6612d411757f0aafff341c592ce45a4b389 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd1037b2c25a0a0dc7cd53d20610212d7322c7e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1889a7a0f7ea318393f13e5e1ee9169f9419051068d127b4ca760f792d71da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9efc77d911d03f14f9be8f3696d70a1e598ed0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb3e0949c5e21d74a7263ee154880ab3691af4c69ef16fd92e2f9bfc1c2f921 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa88551566cf15e50b482bdb279be9b263da0696 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5347c4013297871ca1852751fe1a3b3c3170470e75f856c074cb050dea73aeef +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5cb094827437d039f54b8ff8d0d0e02d8cbccc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79814e4edc84d318cb6f3fd23f30dc5455cf312980fc1cc3a60e3b27b934d65 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63f823a69c0fed852455a37ee9d17df2ceada4a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedd64473a83de7f9cd6e8227ff4d31e583fdb98368d0458838dd57e96321e58 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fda507bfadd43a527936a9f222b566282725f53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b2da5329a8b0a7df37997a82b1a055935a593a7cd5a6180861e465535d19f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a4bf1f15d84f863d4f75719c3c552d0f3e06f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d03f6c1e6fd1076a754323cdedeaf7b14edbdf52010478eda9e19159380dc8f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c82746c61bdf193aa2177e5a0f6a36bca8953784 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573f9861579ba37372ed6e18043a8dd397dabe5fd21d2887ba1d41b66f5d4975 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64f7003ba538b3ab8616d544452e2f4a18bb01a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35c0b952164d9dc91c78bf73765fdd0a46af91ca4f89c5b01a7d42455a6e601 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3dd9214c46db0b40a9b2d5adc5aab3c4c859f21 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb15bd140c5c18cd51db8e890f3855bfb213a37d82e00cb84cbe685ae677a4c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..765f28bf7badc2ceb6f1471e79f65804875ce4bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96418e5d83d32a288df8482afeb7e9487a1504398de73dcb1d4fc4b519d31793 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99206852fc25e826c23b882ee2db7f9368ebef92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c119231a1b6b39341a978f5c9bc2bfba5d2eafa8cf87e6af3c860699c3c92d44 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b818ce4f49e5bdd8abcedee0726771560982a243 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8ae52e6ed660963e807b1587d177cb79e69b8c804820203b4012c178a27b8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30aedcdaa709c099398e3633e74d0980d0ba6fb5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6daf3224217e7b2459ec09ec1ce2e783c0ebe327506afbfd2b1df0d3ab0893 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20f14e3960d19558eb606e0e1c96e65e06b2ae13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b994a8f0631f06f7e97adc0eb64ae2bae3a00c635e8eaca4131efe2dd10ecd53 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea4ca99b5bb301694157b4117582bf00f9698fd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d095947d66b0affe69ca481b59e5a2ab5220ce78b5a4e4744f3d4b22b1f5540f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa78ef3478c869fd9a7dedeb7f547d83bb3d4bd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab16f03557f0e8f2b0ee169438fd608af2ac7acd28356917898492e56ef4a08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31de6268e6262edc9f726240038fb83e1b05a14e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811205ef778524006b1698b694ff5fd2a353837f96b96dc8e54ed04700309fb6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d479755fd043639f07d3e39aee6490d783d59c4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5e0c36fa0c1979df07dadc4e6dd990943071e595d02d4cc8e320370fbea04e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe29babab82198c2bce55ab8cab2b49c6d499d6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abdce0ac0ea1c8fcd45594ad6a754d97133a33ebe26464bcb7ce9ed5ed6c03ef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb2a065b76a9416a3904880f055306538cf431a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53eb0fb3a3fd7e814ffc91c466ceb57528c344f577a8eac22650d8dbca76e45 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68efbff9938c2958e776d75e84d659c31119d291 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967b8a8033a015e8bc3a63d94c786057fb14fedcecdb57e6dd89fc4bd5e15e47 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35c853c8f1f790695298d5c369b85e4dcf0e810 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd90d1685f9d12c447bbd691640ceb329ad7b75646531b5b700a878362e2396f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7a1965f6c0e515a3d49c45e250c77d8fa100225 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd104f031e251eddd8c3fce68f63ba77d397af0741820dba9e3222341debf737 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebe7b539e6f3089d38dcd8c5d50ac96ad790b36a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82f7c993bbc4dd76d5fe528d77dda890ec775ad543ebf5aba0748c41e21e976 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d11f4ee91932995e4a9693536a9809ed17d76fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7bb341a211c1146dec3627c7e9838da6eccb5b47d2bb6491153121d7ad77ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd724932a45a297a829ec335e709e93e9b64cf52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a34a8f314a7c07e24ff7ed80ff21f3ca11ec905c5cdb158acc3e5255936fca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f29a94ae8c9e24a821807acf682d218ea6a3dfe8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d32dd4856257cba4488d1dc0a32b95cb79b2e8083799669a9f467b1cbe5d69 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46d2f0af71bf248132e608931de74513b7487ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46823542299ac30e7f00e132c77397f109224cc3540d66a51eb113eb3561214e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc4856359b59de28f5c5116560c4219a9427d9b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52f829a7a8639806d22505521538714d86f04c3128a94d5df7fe0508a4296b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e2b49a48ffbbf6f8b6da49b3cb3178a734566d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5befd04b094486cf9afd0a3cd59dfb5f81681c81ca8720c09bafed86c880a4d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f335a0b255f3affb9ac545f1dd7251d33500c72c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194d8ae7b9af03f61dbb307af6fe9b9365113f5007271c2682c5dfe1d5bcd498 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b650dcd96255657d9599030a43645c2d5cf8190 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6e26969be8322cd4732e7a00da660386c6476236855011393f070e6f54c650 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b92ff74338a5c19bdffb9c489d325369b66b60 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092201a9367c30906f904134596191d3d59e8b568c291d442a43ba8429aacf84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a361cb8b6db9e5fec993ba69edb2b41e9171d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0e662e441702a30689463b24f8e431907713f54dd7106e78d2d224578b69da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e5c3fddc58daa80c72efe037122f3d0f3c409aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd8a638b078b5d21c2fc8b610dd8198342a3c316cb8294bc385e52e8b19377a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9cf127c94510b276eb8e8ec1ea461a576eed193 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa665da895be13e8923ac68fc7b580ebb69eb2d9d103eb6c428627c983aad4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3112f41dd45948b257b71aec033f2e3faf09cbc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d98f0c06b40f624e45fefed707da4954c9baef9193fbead9569ddecac17bf5d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91cd283161c13e956170fcc5d7e8476375959d7f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee29bb3cf852c6ec785b18fece29bee1ddb72303560fedcee843bdad08dcc36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..740f0703c4e7bd86f4ba4db9530fcbea658200d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0517bc265debc8142d510867cb61e886f5e9e86a70e20a1f6959eeb0a64af820 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a73bcadc52c30347612c288205cb448a58f0b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22420665c167accabe5bd7daa72e84ca3c2b62d9db97b1863102f3f85ad22ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b8182f78736a66b0ad5392b90fa67b85e74b14 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67def52f936a419cd6f025c12300841de7eaca805091b7deb50ecd8a0e88f0a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc5bf2319ee5b4bebfd478615e3db252bd22bca8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b85531e26cab036996bda65ef29226a35ef88ac61cd1357c683fa6bb0e07d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57015197ee47e026faabbf58822ce38bd7bb0690 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358acecb8b66cdfe21540a7fc47199e001fa253c2b59fb53c77222bad2a3b783 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65406dc130d34aa99260782742a211dba8050a6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1063624fa690403028b107e7214845377210ccea097c121e6a1f3438f0834b7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b960a32d72aab1f4b5c6bef2416d96b289680388 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d9282d75fface72d2a5f7477601c55233b36be1c4b0bf0bae27407e31de5748 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1766c31ecdb3be26edb9a82918a0092644dbd915 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f44c233310c398080c52602109d0dabcf709ddca3b1cbb9b6bb64675457a66f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c09a559877c991eb45d670be7a728047e680964 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8c0848da6dd09f0d8a9464e283d41c949e3502f586b69287fd7450ebf563f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d91c4b4709d218a8318b3339bd257a8c16ab5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6b94ebec40d97f0dd22fbb10ab597bac7c2f4f12023d536a4982f8949a8897 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6a0ab029c156d6312a2afdbd8a727caddc3561 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aac8113372e9862d6c09f327e4c12c56e2c1faf368113355849bdf90d56ef52 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c1a40d755819ad36b14c78a7dff39bcabb1291 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba9155532345efca25f0314c210a6837222baafff7b636fd0b60b6736a9522d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b0b14c080cceb42b3d0f6a878e0cfe0f3b6023 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec795a330f21dac6cf4a057d43a8b1d4895720ad58ee1ddad8b4a15cbab8f9a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dba71aa1914ccd657a8139a4042df7bb98dd8b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d2bbb9fd5a961480f27e338c2ebec15c22329d8999606b2ef4daabf5d8c14d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac6131169924d1a9e3d6fe3d49987f2fb41f973 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d716e6a96805e12a5ec83a7c1518175feb50e4a3915480d1722ee315d906afe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed7a9115072cde1282fc08880ee9f650fd8c6cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e4c7db24b1a9a406f978bb3c9ad0612ae60fd87ab117cbb56070761f22ae49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..285273853c84e1afccb48bad67e783ee736a71fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855a6b57577db060abe5aeb9fbab339c57fb62108d0402415328afa00af9e55f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa93c39cb84f111a3ff3bde104c283680293d1f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462541b9a941ab57cca1e76e6fabccd48bbc0353788d1cbb2c62a2bd454adfd6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6f33f267363fe6b5097097ae66573740eec23a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12e8bdbbc095f2720c39c7315bc6ffa05f4e4d0ef6d2c4e78040e2f4f909e2f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..665d267d6a9300cd00483db568d3f289096438b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0feb772fd21cc42590f82963054f7831bcdc41b390a613981531eb5ff2eb6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..745f8712b257caa5633ac2e398f8b12c4c9c64d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4cc23ac588386c13d78a1a6bfee276718a28579584fd988298cb4de2510609 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..632e4fd21c2c9268ac0e8454bec02323812eb5b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6809d8a164eb3a85fe2ab894978458605c6c17de914cde991a0c44fb8bd7242 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6860d86438017275050accf4a2a280362df8d3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f470ab810766a630fb0a5261c584f7ae586aec7c8cada29154f50afe3c6557e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ada66e6f53c4a3cb947666d5e724111576d2d8fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37a8fa0a33e6012d4d0498ada48639fb68df4dcfc5542f2a330b4266dc15cb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..448eec3f9a67f9094c4e4669c4a56c90124fab4d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89c5f36697887adfa4ac8a780c0a0c9251b6935e168ed3e6057e47960bb50946 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f29b8651673fd3a0f2f351eaae970aa7231f22ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2fb1e0e0e0acd36c543bee80f88b5f888648f3466f31aaefd2c8bf41aa347d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a223e09eeaf4b3fe2da2c5623be9673fbf181995 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7014173c2e262108e3e51acfb08240fad43ef3393d213c6e692a8a745bcb9f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5037eeb053f16212f26df4eb64833ccf6bc67b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e210a41537f032b4a2c35f98ee564684ac61ceba21094edc7bfbfe3f31419a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b5f0d4c6b6a52fd3ee549a892fea0edf8c3943d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49ccb494dd60890632710bd684c027d79fd688cae9987c557dc9f6ef932bf48 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56e2d31b5e040089137cc5fd228877d08b5ce774 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea14aa61e13772fd92b8d56b2f719a382520fd79c20cf1a59acf004add1d333d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..238c291ca81b9a889de2b02e98e9d2e5d06049c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2596ad47c065d99da469822cee834214275735a4dcb5b76f963c5b7120b6b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ab7c3d1859707e551fd9100bf50c3311ff16e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a01ff24fb656c36e78b6a43823b814dadb77b28381b5c2b9f479e4bc89a075 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c62e8be7fdf6fbdd1845487f48517489c3ce12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc41d847a72f3229052b456f10cd3029b4378c9d544eb05661a10c14353bcf27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ac1290766a0881b2046f4a0a151a28135327fb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfbe9d1c2354eeed3c26e291f23e260309781052e0336b02e1e411f0aa3cd60 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d68bbaf476f3393700257faef7d66b3daee5273 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beecd056ce7b4f076f21a0b613aee2032a8708a807dc905274e150bcae21f6d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f719f476035b8ebbe6b5b9d738c614465579d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc39ce6022e714c69de7e7feb70895d14330daa5e715a48beb74dd636b3ce73f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b00368d9c6e3b67bceea1ae0883e9198b050279c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790dff128092c5d323b611c7f236cc57c7e0c55e0e3f2a74c0fdbab851f97810 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4945220e04a4c228945c201940adfa00057caede --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8352ab9ec5f38d9db16620157803db154f3018c40685d105b8307e90f471327 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1c38df0d87320dce2d9512da1c21063bcd2f97a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b6f1588d6d0ff3f71dec8726d11d18644a7be7582ca1a248ab7808435b66052 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b96decb919dd690b4bf00d07402f25113e0320 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce8d3a657e9af8cf80ade03f76214b1f206f0a1bbfc677d1fa18c6ead476c06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a04ae3639e9c6b1e8f24f47b4f992919f4207ee5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9d6a2eff6cb42bd1bc0fd7d924776c2422abb5fcf6aaba525305bfdf6e2f47 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec989b92c44a6ee24d844536d628f92fcf4c0127 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf9e77a29954baa828064fa86100a0a6633bf1af282ebf239ac89902914d3bca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef4f2adccbaec68432e7c9fe129a94cfd19705da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e964ef80002a1705ef8d72007760ce8333aebc10c42ae2f7614ff0f3ca7bbd96 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d82da109c1e9a6dc18f1fa1189224953c3ef02b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4369c3fc677b7facaf346d42db166c9040ba2cabd86d5771b51ed9858fd33505 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07165c36d06e592e43c18dfffbb35077f17aad42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:923ceb5a79bf25917a14448d784940a13331b8ca713f5f05ad914dca4ef1402d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f68e80cb700844b04fa74fb76b681852fe6665 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8eb0fbc898a18009bf132aaf3df6d74ad7dd8cc6e38dac1ad09bd7bda9fc1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c93a4cab414f80b01da759fd13c7577c9f98f7b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5077a468d77a9a489e2517365ba4aba5839557f6dc0459887fc94ff237d59e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41944d570ecf7a70be5d67f7db2f7c6b89e4e731 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a301fd897be985bdf0d378611db3f97f551177514a7a0e2a1dbeadf71e0c1854 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..720651da32dc9a3fff02b5c309131d4f2265d85b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faaddfbe05ad9e3a2ba3c9f861a71eda445ccd6a314f2d5688565fc78f116445 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d672cd04d1553ceabf9bea6af6142d5a1525805f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971337046ed54cb68822bd75ed4027bc0de97e27afd6e1edf883b49d637d6450 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3163c61c2ba59577d9c38819b9d1c195cd1f885 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224e11adc6de59c31726e859dc14a42827da49f7951039c8bcb9982536be1e47 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce825bf74deca9329613db50341713f6954b3f7c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c16909f10b05ebfe16dec6efe059904f86a4dcfb9aae207f33b6695d9bcac8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..379758d815e079ee4b03555afd3b54c0ff32b952 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432b561ce730c9d667ab652df79c587c6abcf64e1b7687be0ac6ccaa7c1cd4e8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5439787757b7258d0e446b6ad237dd81e609b85a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0138ec0b9087444d3ad25073218fd519c18c0d6ccd3b515c6b284712f0ac188 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7630828e3d9d8b4139bc3bddf46ec0447fbea175 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a853ed87d1d30c4c16e446a7bae16d22b95a6d909f2b6219046dc6604d54492 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eef56c46e960332ef56c0ccac960ab8e117ecc6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501c89b0471ef79d88f82de7dc11985cb0483e1299abb3a2d6ef4e7eb10aa2a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d82717faa95f1a3c9ae65f8971176bec8a678be0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb68b7930885d9cf503396f59b60db77aa11238d14edac93b03bd1e3cf31896 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a888deea7e594e9d5939a4f33211fafcf13f1c6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2859cf4f557bc2fe0eec0e5d7ba64c9857c1d1e7dd37a0e70a6d920446e672 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cacc5cd869927450855e6d3e9e77989e6a6bf037 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057738ca4cf3473db8f6976002bd9dd8911f41549c689c7e194e3b3829b6da6d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04970859468161aa98dd804abeb6d89766ca2fce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3970f8e43980898e0255fec4052edaac868360b9712723845d8964b1c706de3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61096d1c7fd4916cbea86895019d90d1a5696e28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4283044671978627e4f268d168c774c79b432d6781a0304a30ba47aa523efde +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5460b7cebfc2ba8ce487356a1bbe58b2254ba5e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228a4f737d2ae7e222d7e61f18c314cf443371b1c9a8f4944874ffadc710f80b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..477d85fa69dda2aa3a220008c12f2d20e7d2dee2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8640daccef5008f8af79c396c5a4167416c578987155c920b88bdbb0cbfe491 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e810ca14b9f5f11e77f96398e00439d7d84c82f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a93da900e4eacbb57e3da8648a8e45bb06e134d741ad7238960a9751eb1a88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc59e6d2bc5cf4dc56e6989e8581cb09171803b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0eec11357dccfe08977d1a72329e6bf1b405d0130af792d71b3dcb6287d8ff8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3ac287bbd1f057d193e624eb9b3b0e4521fdd6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af126658f6ba50e0424dfbebe25357e814afa85099553929f20bc6e8a1c9f8c6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9574a4edc0b617397fd0c40cf7d39cb209639b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e7769de04d8a8d70228452312bb53183db50e88f6df29afdb56a3e1fddb816 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eb3cc86eb9805a90dea2f97f1cf3cf96da4cde4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf854d7de27f63b84ad9b3d640a8a793ccc644f0df150a2fda2d512dadf66e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8adbef1fcfbdb81fc8d5e00d6ab0498fbbd9ac6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034dac82b66f02f54314db7d7bc8c344602441e954c751737f3ae9d960371c22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf1a775ea11e6ff08faab25122d3c5b8376a0d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f1560f0780404c4a3a1ca13e381e22cf993c8cc1b40bf3e0dcfcce16ddfbba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74c10d5c76f7b2004f589eb6f325dea1bbf788b7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2e7574841f2eb2ecc16c77a4c362bda4be4a66f2a14b93347d08d25c524d9f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f1a5cf97faad75f882cf941d229ac0e8feb4889 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e958e4aab00aadfe6dffd21f250aed71a2cfbbd9286fa865604b8485a4960f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..701c9cb6e48f7652c06820288882a16a3ac662c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d703617a8af9a1e0550c50df351007e6fca790ec6e7213959450bfee0be52be5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..510affba7dd3d7f09c992f51f74f80c33053833f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6690f338565d3871f7aabafe0ca6bd516b15e71db3a1e0d481000ea0e58fd4b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c83aa6a9fc3d2b850f56cd035b35e8d7fbde1d7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be3c2130c55f2ea8285044bfbc3bb6c1dc2488375abd78d617bc15d5634a353 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2212d4e5c407143aac02ad9bbc8cb6105b548111 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7bf9931bfde870ea4808e7471c1f297e10e02f1f68b99b3fa22c14fee217e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b20360d7ad8f54472b4129c9696fdcdf7b83dac7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa8beb6422808a649f0993b2291c241e3b0b5067bdadfbbd50a7b85dde8b020 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e7e1a652711861b3dd83ffc02c1e41731ea0d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de44d7370b1648eb73e3d68816e38c41d0a7cb3f8bf9a0c5444de4971be19b9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f30e7af77a121512993b3236bb6ff635b1ed175c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728d5b63653a7999376cd80312d441977d336c13b8dbf437b2bdc0fdb9b6bcd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f2158b9eebfc2c6900bb0cec15f4757961f732 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd08ddfaaab56c938d07960cd1bed2183144beab614394c30ea47d96fefc9364 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac376708c5f34503cb6afc712d8f53f9576348ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1df5e26ed2ad07eaa160105f9cb3bf33fb06bd6efd76f24197f734413632ff7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9044b549e1af6dc0510eebff4794f16d2ffb7e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2849fa36ee33c087c53efa6a6722e40abc952bed16bb203234874436c09bf0d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33c501cf62d2ac5b15fab9052c1e60bfaae14479 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dcc2917598583fd79551613e7221345b74dd93c29a32dc3a8c102863c093fb4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bebdcbd4d38b60ac367339ea40ac2494047ea4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265468b9aa2e73190f1ef1ac15a8adce299947fb9bc4b13e928e3fe974afbc90 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4276cf94dfcea8b246b576beeb7b94a787e7d342 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7551636a4d2ba3d0bffe2d08f460471ad7d0d1e53b5c8b2ef38c8c00e485dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de76ed298b717e23f10b9f7a086416b88780efc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d48f8f0e820845933c1992e4176d7dc4435bd7badad29032a55828e1538a27c2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e5a5581cd33b3a8eb4d0660adad9368b7562be8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a3bc442a7563a5392958d66423bba024e9634a4296af9d3b20f059c1dcb39ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1457cd59fb67921fbdd57a4c34adaa5455f39100 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f4e18e8d8a5f2a909abe2abfb8b164a4f6cd6645e1b45252de7b91e90b7afe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec243fe2ca6ab26dd9661f0946fa3a31f781f34c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327b9e83052dff966fb691528ca505845f63bda4daf66df586456a649a640ca5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a13cd3496681d3d675adaf7fff1bc0c9a148de0f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:365b32bd53d2ff3c75c71b19549c78d1e700a4c1c88b8baf6b03e5170616c207 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f950ee07ac75e9924b32b3023488bd446a1761 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f0edd3b78d8853dbfb9e414461ea9005259ef58cd17b182ab4fb03051b66cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..188c03db5b3a73075a42b1f6716cdf3f78fc638e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11d58dad1131d723faa3b1c6d4411fb4703eab47f5be25ea9619384182418e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..022e965260354c898951b90fd98b2b312173ec2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1011d612fe46e5115427cc27252fc6a10a6777c5a8d680ce95638a6f50b85667 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09ab567ba526585c3430f3c724c058cffff638d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5009956a266b0511b75ed6fddff15e06c57fb8d5b1f6fd766003c37333bd08fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b236ce87758ca72b530a9f69225df46f168b368f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72dbceaa8c192c83f7ac01fec3751bc2a1edf4b8b294e3cf1455c2979c554007 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca6830997f70946b93a62c73ab6e7f9f7a1521b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a09bc1b59eb7027a04fd762716308beaf5121c939d069339c8e25ac75d8db3d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7be37af1970723671ccfdad51402e1b53f87e89b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5266c700428b855ea96dee4192aad23f964654f579713dd1527f5ed611ee2245 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c4c6fe5c9c7b439ff8df9965f1f6823be977bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d9a4e836725d0f8ead37c67d9bdb191acd19787e69d25279d1344ffd0f18fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..399c28c9a7db11c128666e20468af5c2d35a617d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f644680dfbd72d15fd006c6528a34e4c61251f63825e14fc5a50775f7175f5ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7f158532825161eb2c566b13215bfbdfeb487b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e6e3049b82ca0a3e8714eea52c1e7aa97637d25c8fd82336be7155a5e41eb1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb190274702b27e1a9ede3a5ed491f8f031bdd72 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce03f6dda02be9810cf0ad62e101e9ae8a1786111d623549e355422ffb15c0cd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b27a993bb8ce4bb4ac9a287c4dee423041342e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f3c785d24a3de38b8781229a6b5455646cd73993462dab174fecbbef4c63b94 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7cf113d2b31fc80160c734984de0fd59cfdd077 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae9c7aabc9693d5860e700aaa25f3754638ee2d4249a9e0a389947f45501acf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d91e4b9e719d723b6cd2f251f63565e663fd30b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e34813e15b6aacb125f1d4e5304bb1eda9117dc5ef1ce1f0f29086d2681df2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e723df0835257e16529f242e24b26a232b0b872d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973beaba5c365315cf7774c05554b9462994e57289389e5820426650b8083bc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5886aeeec6a73ff2d895b2ff7ac00dbf43c90901 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01099bef3a06a35cf0916b45e4db7c6b98db1337daf5c3805d7147f8e7e5e325 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..234dc04a9f4549646b138d75b8cea361bb6f15fd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2711182f5159b44e5383e3d7325afb3ef4deb8699a889ab9a4621ccf9a2338 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d43df530e9bdd1f42363b7cd23b8631bbdde9a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc124eaab77bdd704e05bd1accd223a09bdc0f6f7946ccee516c34c6909fc3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..844d5599a7f165930b4eb6842181fd2495625a53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f0354986351b286c092876d838c4583404a9c69a2e3424689adeb26db59026e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07eb1ee7e5de891c3ffa230c9deb5902863609d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa158370dd5cb00e1b93dcedac68c665c4a7e1a3c38d70b39d13ea924bdeb5c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..259b3d3620c8f3b7d71aac105e23982e69e7ef19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c49f2d92e64026498f65aeebfab6c0cdc9438be6bf6fb376af8afcc50dbe725 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e488afc097e4fbbfa251a86a4f24a7d210bc47a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1736afd74043be9e881391cf1229d1ab27f55f981c506549187549b74a5f9d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba0f82786113c7d8fc1a7df4fccf085bfd9d538 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7caca144e2b053b3bdb678066eff567d366dd6806749b2819f65744d2c2a5e16 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd86b2b249aea9b05a4d9deaecd9aad3c695a00 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3073cf131619f9e9b13e5155294728c215c099e0270e021d74f6801e5a3fb69 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..deab05ed7aabd299fb647431710af00dccf15ab2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53d96cebb952021b7d129af265beed800c432502a07dbfe9aa7554dd2b69ae8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16299ce1fd07ae8ebed1078ffc37008d689acd17 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d436f9640c626781b7af46d9c55017d7b262792c76c4ca070131a5c64d8434f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..befa5384229c775e8f218da1d58beae531089bdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e55d7f8e524b270322ec96358b86bf5022ebe7decdcb8acadac6634a0d5eada +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec68a364353c3002e0a3015b59b225a7f8e279d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef6e30742b1e5b4f9aac53a92afb077710e602df7fb26a3baadd261162fa7da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5bf1cef6b88dc4497f06f613b3153e099ebd4a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400af494b46e68338a089232b6638c5d66109bc6ec5d65b2566155781fc0e9c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..839f012d996909f49bd7456bae855f9f0d62e83d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c39818c3e779b120649b92159bc91469efdb79434038adec55c84435be113dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da2ca00aa29845844cf22c764e4bfe4956ff378 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa71fa0483585fc9f5161c3697f7e795ba94317561c2cbd8cdaa1ad64b6ef86 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc74a591f7dd14082be50bfa059e1dfd9f0cca74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca771351f97a1a5e577b1314dc016292c3914fa3a94667c05f4457364cf3a98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b48c67fe9348373f2d2fc193cba21be5817309cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ee39bd5a8dbdd2d67ab381d67ea00421f1306f5d8d83d5fe711ff7d63d6c823 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c60a4d3f0d3badee8bfbd36ca2c7a44967318b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72a266cab516d401911d9a9a8203cc2e34bec4375d7919a2da2aca0d13b57c49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3759e50184f34ec3690dc541a220479e3de6672 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c4510b49f3e4a8ca42a4f65ecf31197f9247336129d8954ecc1f7e04d4050c3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..def4db2ffafe9fbe53f1a260c817cf0a045c00a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68662bf6c3ac1c5722aa6ea071267fa4fa362ef7544186f01e2b679d084f9c2f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00013a6a5e4b32d17787e829906fe7ae2fea866d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76500aa318ce18a2bf77630ddf37b52f4cea9a5d422876f8fa2c63c7c9c0e482 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c1fefa13e6ba769fbcc6a4e24fad32345ae39d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa8ef8d44ea169094bf5f9fb50895df795dfcc38815c22b2020cc61e2db81af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0b3a6106f7f7eee27e850c3f8b09ac4abf34a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf3be89349b3c985628c03577e92f121b902dcfaef16c122578735bdfae913b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a071a67f2745a9956c3bd891b9acce2141614185 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191b3dfa83159261b4acf66bc8998c59478787a1defdc6d44394b6bcbfe09916 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cfa731fb2ef5304e728512ee15d5f451644503f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edc0fc9632f9d3ec232cde979bbb51f46f91df9948f8f5cfae333fc9398f970 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ac88202b58ea98c683bb307ea9ee08c867d946 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9fcd5a85e899d268978b3fe60600dc56424f9cf48a8710e57f79fe373d3d86 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..683e50a0405949f37e6303801deeb8c5737ab491 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0875ac5add8d29ed85bc452fab5c5948108880c8f242e463a5cd895acbf3ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76eddb3be2c0eb11c6fdf15c41db6e06f05e221d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3745ae7a14e9b3c563b7f921978b36f55d4dbed75a76d9c7f3260b6dd1cb9d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..494d629aa2d133eacae6857da1c13b163fa45ece --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63cd58394aa2a6aa2f30eee67734d9f230e0679c85cd664fb77e1bc4c87c30c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d162bc9cbb644dc3be8d61ff45db9ad08cbcb2a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff87d3179b3f32ff007d5bc985a09bab3e06ffb60f044ded8bb2c75bd55db4a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70af3f9b195ef65e546b267dcbb010efea451ee8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cbb616d604f4cf5125b54b4206e43c43a29fafa63f9a742b444f6190e92b9b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecee6ab5f58b273afea523bdb1919c01eec7d7b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d75e2c7fcfa77834845ddbd5b452b2aeb9a004343b297b16c76b57fd6dc7e3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59654ee1acfc7559d68573bb47ee963be1f2026c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fca9abc5432206a2eb062421cff6432e001f224112133f95ed0fe9f748128c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a2eff9b3eaaf47074e0bb05df2965b030fea6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c068d74b22c17364705e04204ab687ed92d95411b33be7bbb98725f20bfc28f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7b1b50f2d1b99bf370f52051b8b3a3ce463f5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab02dc5ed580e0cb3704c5b6de2570233b6a4bbc83a4e393c9f027b309194cba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc0fe3e1f23adf7187ce2a1036eb673436ed964 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239f885ffa0b4ceea0c0cbeda207de638ace6cc4d3bbb663bc674a0372367b6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9fb9ae981c23afdc813eaa05f466a61e49e4f8b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61e1bc389ad71c622c96281b871286fed8abebe8dd9b1288abeb749df1a13e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..523ae19954f5eb519154d7e38ab68ed6d5b18210 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3082652985136e5a72a1c18845ee7aa7998c974740b8644e65fb029cfa37390c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71337676c421909ba35fed88ddab798bc8d0c6da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82efe143dd4bffba6a3fb83a9c10810c61a5e33ccc37332851197657a2620645 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96b3123cda909beb01db2ddc489f37826c1d128c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ec571ddaf5b5d179c6d2e964e59fe19fa744bf1af8a330448cd52a80e85501 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..105219e202874d996ae33fd6b64731e3247d4639 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506bc28b430638cf58ca1bc61bfccf85919644241021a2091f6687ebcb246643 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b946419224591c41b8f77ab4ba28cf19b7ad2cf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8818214f4af04471cd23ce7efb7b4166ea704941b53930b02e397ca90b7ab6f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c386807f325341d97b3cf3cceedd4a886f0567b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332c1d30826c0b19a738bfc342c1a8e86757b5f75105d4198c1fb65f017d9607 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..434a419cdb1f9352003fb50795fa40b409c7c293 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611a0f8c64ffaabd9fc94853305a60acfc435c58aaccd8cf2ecea34a593e6bfb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d61f8a4b4676d063d063311eea8756aed97a7a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c23866888bf53806fee53d8283a14b4e3f75674550cbad1e284afa3eab7f29 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10ee6884533490cc63ff5aacf20dda1cbb9aa00a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fa59061b04b9a071e5205d65dd38c47a0181cf47a872437309813c8c544a70 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca434fba33c0e8e42dcb03a34b50e8376f9a294b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304170ba07c1f51b301c8ccfc625c88bc6b91f00b92b461695109db5c84701c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c55b962a9f4d659fd88d73371a793593fc973ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3938043e39b95754d85e0a63246fc35504b1c54351fcac967fcf88f4db1146e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c122e3497531143abb243c038a8dd2c82853f1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a7254d68b55e13a66817f291dc0915101e90b9195c88bb4b828210d864c720 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d52770ebd61a1ee2ffc62c1d2d57756001e9cba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f1910d1408d686c14c76f4160e0b38c78a5917c1f0c3eec0f857e1f211c4c2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a1faac34b29eab3d225b5d1ab076c7d3a63b32f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d159a2c6692e28b44f9d0e996ff38cabf1ed32bd86b81d4b97e1ea96065f30 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3779fd8a3c2adb10cd68cc2387a583560d194a7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875947a571d2830eab3adf5948f13de7a46fbb1cf3b7fbdf97d7575e3b66a6e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66576ce5e433f19012427cb23ac2ad720ef38a8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780bdf62f0d8c3c8b375c56dedc274ad631ebb6cdd4086dc83cc9df5a2eefcc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c949c9fd1fc330fd3853d4103a39629055240a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2066a4c93a9a28f355169ab4bfdba792498c59eecd9bbeb2acad4ab080253c0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba251fe7fe9168c363e86a464e7ab9f816b790a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e489facf58050dd116edd7be177ab86594aea19d5f7c7a892c75504cd347cc4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8413138c97c8fa8408d11aa9645dcc5636391253 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f84609e2432c3be776284e17a8295e86aece37c35e5cc937ce98ae30fd8a8d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12845d140e5d994ab484a234f440d095f95f6998 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93846b4404001914672d7fe69463435ed26ab39b0922d4588fb9cb8daf3a80ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c702a23c2bc15d94c62d732f1532b1e1296d8195 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4621c65d1a8310476b777d4e4ab8afc6cc5d1fbc2b4669db202b9b46e438c846 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..718ff3a31de4ce6e687102c652cffd42b557ae16 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb29806705434aab7de735b0a3433ab5144179b21b64ccc89b8cccfd98286a05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56918510b38073ba1c58bd02f3c19aee7ee7642 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b9c25af59a314f90c93b717c3e210de72f83c8a619259699a3a8ccf28cc813 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf2daa0d2ed6a7cb054f06c692a5b2e3b2a7d9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e5931ef7fe2b8bcd430e7fe47033c945d2cc156e159a462af98a5aec39f2ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d61172b0063bdb0a96b5556f07462b8676d79d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2449c1814e79c60690410c1e349e6d55d5a9e78356e4a83d53ae6ed55de398a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..164ca7c5762b011b714d9e9c61e7004a602d44c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99fb3e0150f17212e83857b93af09ce25b268d22a8d87368901a7dee97c9f5be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ef1fdc7c8e94e5651b21256816a82fab13f848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669cdab009bd64c204e8b344443ba0e68730ea1b70ecd011e61f3561c2d17b90 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..254b24a576136eea6d074178f165f939a6d4d958 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accfd0bb117fed46a4a43f0677b67b1ad08291856a480a3746f50ba450a2fc54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f36458899ddf39725a8213678e30cc37cee27bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28fa3a684504b888b43cfe446c36b62be87624261f7b220f7ab971c788d33006 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb7b92a629c1532268f7e33b813782ff288d1657 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef7dbe924a3b9c51c501134b82dbec1a91596e596900f0cc7a9c612fd82d6037 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d7999f84b89053768fd72d587883fdd7a8fab50 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957e4e55310e23fc98f4b4617e23bc3b88f228f3208b21f38201060afd5c22a8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f3f75be6039155bef6fb39bf68b38060edf6062 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ae7a49e073b91f7de94e447f16ad0d3c96a7d51b05704fcf7b01b96d23b79f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6b8bf26cff17383d5d513f4c2b5596310177fe6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4db563471916fa85a96e3a71c87c2b9dff5b7abc9fcd1342c2c32e2c88f6a25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09b2efaf81ba7c0d50d3679583130a08bbb9e88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291ec8f8be203b87bcdedf09dcece04751ad6d85765afdc20a1f69d176aaeae7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e036f6930fe3a18aa64f589b269bfee750d071e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fd611e6521059ceb0250a60a8416b6c9b36cf9c2a99c023507d678d0a611dc2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e8bde86154092e7ec269d1c7c99482c9ece3a82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78d60d509a4eb0cb95f0c2889a9a13dccfb70f15088085c26e147496dc160c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e19cf0e714fe033b754d1f7286d32c8469801e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b83fc05ced570647ee592b0c25772e8eb74a6c572aeae5e0fd9069241bec2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c392e898728a424306d4d7eaf5d99a8c81652ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381d48d41fe8918c43065ea77b7126559df7127d356c9755113fd6ab0624f3f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..035ae902e28913e5925829f269f61ddad98ecf39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94135a0da744796d58431509bee0831f58c861c7d36d1bc615b67eb0d48fbfda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..285cb74658f4baa70d0ab13a63e6c8b72d2beaff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b39c08f402c04a2532afa1d476141af6abbcc726c6fa1f093ca2ade4cb4d9f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24a48aac61ba05a5d000ecbfe99c36f29c6bea6d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e311b17fe9ab569876ba5ddc30b720f8782ace00e793fea13970d88e5a92937 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7d207b031d4041592081a00b47ae41eb43b747 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:982224f36874d86344688e242bcd913888557591cd6e0bf0ce3d48ce6c18fea6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d547d37838ee26a066195e0e63ec91ed62b217a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0547f98cfdd8c9ebc62ead089f473cc8cb94a810057df179d322f039dd4b2d1a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de84b2eefab344177d4fbb431605bee3ac1eddf6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e70d2f35f2d278774d0ccdedc7566fc85a41caad23f0d326f040eab876d3fd1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f8fa4f542d3764e180f0b4c2436b8251ea9581a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24159b4a0a39a87b684d20303872900633f11ef6a9cf80b5fb0cb6ff9d7a59cf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1a6ea06809a610c2075b984e09af0382d4aeb2c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284f51ad0c9bc4f37bbe0cfa707f08a5901ca209ad1adea706e2fc5926baeeba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8102d2b93e557ff42e5f21d4e3b6093d41fcf815 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1d601738dd219724c2adf64f3d50d7107e34eda77487f0dc6275d3351451d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f40d3032748f3868026f84ea53c42a4eaed9ce2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4f6590813da0b0fdcac8758b2b504c1dcd751242abdc23c724117745b86a98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32da78b69b4b55204fbb4c8b378a1856ecc6770c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93dde59fa2c4379014680c0c1a405146d9eb4e256e89d7c60ba8437e514129d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a989d6fba0e97797024476f00687ea445e455260 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d61fa92b2c26637f88933e3cc5fc8d2550ff7fadcb43d59e69a039ee098e07a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a837a7d8eda0791f123c7bfb29d96d9e2f5750 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6317683aeac6bccae047e515c437b5df8e43c36824c7afb4faee1d780245b1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..720ce00d8c12468fd1877e2356e8ce5fa3064655 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb9ef5047b235a6fea5031095c47a8a70100af7a98c654fec85226555fcc82c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c7ba24b06914318209325413d6671c01ed5a9ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26edea53aa9b831b3ebf7b8adb2e0813cb340f0eaf1ac67373cf12ab409368ef +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1278aac47053b82bce2a83f21fcbca97e7ebde2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28167efb30326e98549bfc0a027c494171231d1b2710a31e6dbb5681eaeab37 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2594325e28fac9c05525bceef14d3b64fa845bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6791a73c4e912d5fc4d2ae49fa95f1ae9748b8c33577789ba15656bc00217840 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3444912eb7453a3d0c421a54c269fcb7baa67dda --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b469d0e8f303a195b87f18ed30914bb61631b0d520a4e2940bf4c18af97a46b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c549530c2cfd6e3e1235768cedb7add1251df1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b01a310508cd1067508cdd173f90d12450056516e77eec237f5dc4bb82d6087 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82e30560ec71590ad8c16cdfbaf1809140b150eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:472606ab68953dac404929a67e0bd5f37e0ad100e96f383e457b0e663fa7c6a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f0351d008f03e153d9a1d8edda09fab8d9ff0dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884bc2ba06c5599f6ed4ae9b21918c3e8d5c4bd42256aea628a88c7aff94fe33 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22cc89d253a364fc6ca26ff210f9658c7e64315c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13058c470dcf0a3525fda1f550d85c2f530175e86827730b6c142c8264869645 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..027363f7ef28b1141c3f57db1dd834008efd7845 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ff92366a34e117cf3c152639348548ec5f29b61ae5a37d27dd66d5161ba6f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c13db5b061f5c43db73b714b04c418817eef595d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f10caca2d484dae502c41c916653e53ba2eac107daf386387438eff32c9f206 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7442285fd7cc9cab8d3ea092274243045395b1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:037ed1d6a8e775eaff39e8ff0592455362fc11eb13b3fda0340f85f27e60aab0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b929be9473696a2ce8813d8ed6866c1b3ade35ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7418883927535010109d85fe5409cad051cceb0757536bff78579cb43c6f0763 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96acf6c9b1b5bcd34ff090b8ad368cd005d928d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca0dd2ac196ed8dc696ccd3ade36d0cd0b1761c901fa2d120478e223e30eeb8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..089261c6f6d96d608f5ba5f446985f6a3c961187 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099bd76aeb94ac1e921707904cd7f4bdedb6a99048758a5993e1f9e62b47d473 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4481ae22437142d32a83414784c7a0a45d849d9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c649844a5bbfa5a51a4affeed9410e18b6b92b9e00fe63069fdbf561762162c7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff919bc1262c65bf099ffba1cc1171a81ae9b982 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b97a7d842954bd178128e050af580ffddf08a08573df4d899955e68b753afae2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e1118e7378c7372e52fc5d068e746a4410807cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02bd3e4dafeef05e30fa39ff0ae5e5ab38c3995e15b8cbe07e7add8653b46c32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94c8d982116354643074c57f07616fd1ddf0cfd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0125a8bd5673f17ab5f129796f163766beb5d2966a1edf59fdaef3bbeec1434e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21ad48668db6dbaedcd7ea016d3bba1be5a4fd84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfcb8c761e4ccfa1046e2a5781a71dc961c7dac5bf25d948549b0ffb7b89e39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21de420f82564f5587dede01cb98e6705b02d6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:633d72df944e9e02df7c56b6d76cfbc357ed9bd836d906d83c2eed07e14749ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94b3acfd35f6523bc3766e9711b0d44b74f36a09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75dba044d842efc650e7404f167c98efa6de877b34c9cec4785ca485c0d0ea6c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..250848ce7cd2f3bfcfcf3aebeb02ae2e4bddbe8b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751674cf7db74be43ddfffab2d7c354a474c530b3aea66f3633d70316cdce12e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb928f3e6429c299c0c288fc1235917e0adaf17 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcdb47ff496777a183e163f48060853d1c84644d3695da506d06b3c2546ab1ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4856c9489ef1b1a505587a9c9f1885e4deee4afc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d4d4c4a23299b8641c66c9080a9a206f746e78238b33bb599eccf869106df2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc1be413772cc3620bbaaa01d47c7d0feedf3e29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d54d0a4f6952bc3bdd6c3f59b1bd5f29d48c5b592dc1f5f62ac72f5deb33e037 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5deba6e63a9318cad1960266d77f5dd4a490866 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7e0c6044aa15abb9b58264ad38fb81868de95d19338ec96d5b1dd4cffe1c99 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9545d3f533c8e1e6405bcb9cbebaef69b3a0b6ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4a09a192dd741c1556f4c47d54e10a64619f612680f73dde9d62e8710941b45 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d7cbd2810aa34240be0cf049f236282d46cfd9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442f28cfc2ae55326ffc6011b8e55cc25a4a3d4a98465c8a23776aac3e063686 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f30938f2a0cbc6c46f2cc5c00ad54723bbfe2de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64beb93864471ee0730de24397dbbfaee0d8421d22877d1a7eb4d85ce21d04f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b18bbbffb6f6f5ec1327ea268a3466458a05e2dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa22d748839bd1bee5220eedc5a37f481661fc1f584c5648c18631957893b26 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c45649004ba548bad4bd6370d0fdaa8d19e964 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e1ead98deed818ea8e0714d41e02cb3abd706a4e681351f162c609a77fb62b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d22381ede9e844c324793c76aa22335e23f2a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29be1228b5cca2d708356dca4a097f889b99b8946070cc116bb08688e7fa750 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18deeac82f8c720ad4816839243177c5d26e2c52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c222a0bf47ba918cfa222f72b7a6cb9db12606c234c49fe72094df41a923c2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..691665e862d9e67ff1bc135c4f9d3b2bd92667ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc7b6ee4b8fc43733891b786caa4330afe3ffb94684331a7e364c11d0cc1bc5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d20e2dff9abc25d7febf0244e23beaec43d2155b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f8110335bdf801937e562c7a1660e5629708b018025b6cc6e03d58854a93a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4964b43e54852601aa129102489b58bf731cedbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49344fda8763d979fc7a4ffe8dc395f7ffec3a32c13e3e8ba33bab175b5d630a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afaf6022ddaccd6dead4269487511e398b056761 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:439cdb821e2c96ecb0ea08d845ab0d3b96d21ab18a38597e67dac5fe569c3192 +size 11395