diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e078af374c83c2a163fde43e62e6ea531048b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb55a4e9e8342697105dadc3bb84eeee326b86a6ba74f7c504dc40e3d7de324 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc005145e25c79b36fa7c70fc706562337777648 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aba799f1632052ee914435803506759d7eff2f720800662e6c8865a3002c7e5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7b654ee851e64af044e56b3c8c23d366c2c7cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e80df0d5581111fec566bc4b2f37fdd5ae378f7f8d7ba1e9a8ff3bbe675411 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa88f248ec61c42658c62b7f52b1130018ef45f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ed879f84abe62dcc26be2e341fb2b9e5cc0df05e47cd3108fac93720e5d192 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ada2af7e290ebf482428f5f67a98dc8649998d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9bc183bad7dd3d93f33135b6b952ba86c1185f7a3048ad243e9a68449162fce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46b46ef8a5684d8365feb6c0fb74e72af8089186 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87eb7b36e8260e4fe053ab7c536cbb59da127dbe63a826dd0fb17fafd97ecc6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee2aa5abbecbc4403c1dd51ead860494ce380c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f1eff08c6d6d06762ceedb22321f199d1a442e9faa3faa730d7f7c1817e3614 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0626dfc5451da7841edb0283411b32f8e5f555e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea40275f266ee70de87a047c9b6fc7c95a1a017f7c83bd321f712dd5b61f857f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da4ef94941ad87705ee4b727a5df3aae715f074 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba72086749962bcec24f284b7c458540a479bd83f7e7a5356e1cb2886de923d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1109deff46eb99e91f5ff2f8b0215646aec9572a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254fa314dee77fc3d026a830844bb36b18661e0d54910f1a0474e8f1ea261e9f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a1d35b83e21f1c48f0328ed6d839d8eafa97839 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c6756e17931f736c25299d8a79176bd3667285abe9c3ae68f9522bd2531f5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c78e9e06209831361e3b5b837c34c7f84785e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f115e1273da746f4aca92d4040df098ec4dafce9b012e7019e74689d4434b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8d25e2f4ba55ff72a78bb071b69fd349410fc4c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eced5af8a33d49da78cea880e72cae72d0171d35911ce82756c39ad75079c606 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b23e6a2dd93101b0e35c3c3a203d174833b01e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015c243c31d62729f665ee8b67802d2b10e89009e51c9bf3d13ab221279d3371 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c46c13cd8d42bd172fe20618cfc57b94d5b0295 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1676aef012427b62d5ad7fe9ec7b6e9661ef6fe9214072ca59c7ad9b5ed9be6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a7b35967407ff5cf861d6397f87621f05a953ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2695a9dee986d62a93770660b62a37c2fc09555b34117cd1b3a7ba0cf7033ec7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edced55880f37229510789625784b7921956ddfa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b0d4155f2f2effb9767cd16314f7784da99ac5523933aca2f4cb8ce99e712c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0258bd45b16df9894e5b495e84d69fee529bdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf93af9ab7216bbd44286b66ed1f8d727cb858b6238c3306af86ce590923694d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1321bd31537b79ea0d162094d2324012b2d0ee46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae19dabf499e6911657b58547129e347e93caa34ce35824606ca8ebbdc70ace +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67130768e7baf5c6242d3a9daedd4df56cc292a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e29981d675935b102f0db11c1f0f07e8805fd30d319de71dc485ba0aab7f25 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f2d443fa5cb11d6ccdcf3f9f2affaae60258859 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e4a3b9c91bb429cf8ea81bd9f028e0aa8cd39e88580ff5a7bffa8d7f7460bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b414c6c9018a0dcb2b5d06b98216ad009d706f10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8c70a75fe6e904d440d7714bcfd2bf13a955821f503a73b803e7cb59c280c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b6dd79a4bbdcfa3938b81b3b3f8b37c6ad6d057 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:012870f1ccafd17d6385e8fc4dc58eec5a6292f261779769d75372e5bc45821e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b188602d7d472fdb6812099836743f2d447f28c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eee411b74e4d053b2a2c848f6e7f2dcbc4041e154b9c330c8b7895807144ba4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d418ad897149cf150b6d574f3c70d0061f9f0f39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37cf77dd91dcc39d91c8ff67ff0ae81d8b01b063bfe40173c4d29aaf24c9d9bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a7a958096bc6e006014ad8192e065fae171f40 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efaf48282be8f3e023d0a2b6c17325eba6d1265e76e4ec871c30ed74d3c4d486 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df2918619acf36766ced12babc3d5b45bdb3d64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e30290a2e870377c7627e2de5675f7e3e48b368c06a294fd84b30e8a9fe9022 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c6877c8c70394e7c830709e2c85fb40e796b32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea4980e91b9a91e56c99cfb14ab8f9ef797ada643ef5e6389c38710ca4d8685 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b34d9219d1efe5f211f9832fb89b174f449b1e9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c25416b4d5651adc8eef96c9b091298e363b38a7a6fb40446f38c7bd0fa5e6c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4483dfacec03cbbdc3362e7015261a3c4fba2c5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbbc075c564943fe2550ad26e9cdf8eca966037cf9560a13f555acb7da162fbe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ca533baf3eaefd6370aea630ee787d71f3d5e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c770223cdd23525f6f731b5f9a62353091084a39e06b5e8ae4975e8d3b7bef9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26a5c9cd9c2746f4790e167993ad27834c6a126 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd6c9436c22560a6d4baf1f8519a5dd27972760220dbea1aa5188fac87ede10 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21721d86c097fad54953c366ba2fd45ed992067e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9477ecdb8a8488a4aa7976890e25f4ab2977c33affd27eef6e4d826198793904 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e90abaa1aac5145484837fa1c76152b5264b5569 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a721be65c7ea6aa3e0e44e8b7680c0dddef815efb1af0293bd3aa61a3663319 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1319bc75ee61cf9a3da14ba25c760d466cc6bc91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:542ec6d2deedfb1edeef5adc83282efef673bf6e5ffc89eede3be9ddb7a44c06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1db0fee13561bc643f43e24761f43886a127af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb95e0a84a2392066b453883818c0f9c7fc5bd45d4f29180c62970a0d258f8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c66cdc5b596a3f9bd48e8d052e0315bb35f789 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0053cbaecfea7bdc3061e9841da69411d0c78ea78965be9f78c302d820bc01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d4462a7cd6a840d13fef5efec06e5893d7d634b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f44439324530319bd954f084518c7ba3cebd0a9a2a52a188fca0cc59412ec3a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25898a5ce074d748d10994f781074ffedf450e61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcf5fba59c1e31c57a2084231dacf62b7def123423e4f89dd92b55dc91733f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dde38394224c3e26038736c6bfd8935cf69f5707 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d582d067db5eb79d1b7b929e797aa3f4f2e8bbcecd28c04ec3a010c8d6d55f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f35cd05087f1b6459606fac51d77151aeacd62c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f54c07cadf455fc36a75ffa44702528211476b512e61103a96cb0b2a5f2196 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ea9b661b1da210e3339ba44b4fba9eb75615a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eedbb8676abe42a789b662a71315eb3faec5efa3f69e298878d2124bea14e316 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4f5b23403e8da079cf0454e20dd30cbf331d916 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b5843eb81cc13963f59ec5493de6f5ce85b9ab45d31ace5b5761bfd9d01983 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6e4397c73a7033fb655bd7aea7af5f13dd5ec5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee031c6b42cdd72087a8eb698dbb8d9c6354a68ce356de2adeaa2178a6d5869 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41f76467632cc6a527d59eeed82cbd51c873ffb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6959c4577d98ecd6c2c4144fe5145b94d5055e9cac8012db73a0b2a26cd12f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05d55d0b8f6efb4ae50369eec021e910257b3e1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67dd412c6692b619c3c647dbab6d9786138925843525800567993831dccf335c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb3614c64a9f7df4197ad52f81d58983a967fa3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c16cc640ae2da97979a0898773fcc87c7806c4ff3d809b78f0ffdd9d3c8c8dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b133b1900f28f029afc1d2c6b7dec0d56ebc6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a6b8802d52b174b4cf595146e16d3870ed80ae160705b68c5df29185a00858 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b471ad8dc356451556c44910c92128522f3075e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c8aced4086976709fc0e528d9af30e74089920f10927adbce1e7ef208ef5c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6168baf89d88be0e7a5bf7203196e446575fd8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630a297eb30f153b11a2ede5ac5f534dfcf4676fcd49fb4e587b02d52a376402 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc9f7c9119917c7535f87a990cfc2c7216f8334 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0bb05e26ee1d86929147cfdfd8d6195d060a25e21913df33d2a065c0f4c2ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2d234f46fb1fc55688b46dd5aef0fd7fe3f5c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8358509f681422c534daf76dbceffca72b2c12f3332d22f8315e7b0991d12556 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a6103931800aa1540f8c3cb7143fdf9a91f3ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5731f54d85225f860f239fb310d5f925e92d90e5d9156c6bc863f5518c22e3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31fc2f06ccdd09fc596eb5829823761c97c59956 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c34815ef1d6772ca81fcdfbc9f218d507e6b9ce92172546b35327821cf1591b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa777987b165f0b50b0894f22503a98eb090a8a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4275791e479b056169f0edcd3e64ce0eedf34329965fbf7aa9d149ff4f2752a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc435bb90752d31cdc9efb45c0c098423f542a6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa4e49786dd97dec1beac93138050324af909350302711142363c8e284c721d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df53ee34be303ac8894677e13e67056d715b6f79 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:592379452a9859fa0eb1af2e7b8e5b80ea62eb23d4527fe180b956504d9b7947 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da55158c0c1cc87432f94fdfdaf30afa8b13a615 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ebaa42675047c13048e99cb1d690bd5c1ec1bc76606a719b5a464a5c40d966 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed815dda1a746e301340ff3fef50a61dd46a78f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e289d6471050e746271b17c1c02f2cc90fcccb418705756d52cc43369fdf24da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f420d3cea5414f7c4cd83cfc5cde29df8245da64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f60d3227154b94ea1b00c557cf7c6400f223b1a0f0128dc66912d486a9f678 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace16076a7b9240e265cd696178b78315b86e790 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b685a93375e04bb7c98cbc2d90802f7a07b7649baa1a709a13a68fd2f1df33eb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dec6df1806e063f6c213c43c5da2e9c7447784 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21271e144a7a010f591e72ee5ad34fa2e0a6d22a0806c48732a1e9c9e9ac9a90 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68bee7dc99172317163f0154273745704244abef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b528ad045bce9bd1ff36581d6cbacce62e85994b4d9661bdd8868c9d7ff196a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f0880d7d743d20c94a14c220a166c3037a803f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c62895559235ecceaa706cd76dc02f3ddf2d4dc345cd0b148ef3c1332568d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83745134db91ebc5062627d8f1451cac5109b622 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b466c4739ea81a9b5f6d4f29732f4725f3604bb11e87b856083058b65f7f3b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b06738ed829121ef4bd577a3c2741dce83f8893 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039be7ca2162a160213d50fab62a47c286ee402d8f59ce611591ef288886813b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2762ac04c654aa0805d07dcab447725496e1b4ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8882788523828981e3d3f9da834397202c897a8b2919cdbd35e63274775306d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b4c448affba046707fd7fab6e4fdda1f16dbdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50074abdd4a648f6930984d78b6dd4e922a1ab38365ae8c6f75eafa1155ff3d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..837d2687e56c746e9537685c3f0e7ee997445b64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3e2e60b578f1cbe4cd48a4d565851590db0abb73bb869015e75a1214585a76 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e88821c246540778994e70e144cd933de388bf0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb333eb6e9b2b40afd64ea115dac2e9497fbe040008a7db1ca58570a936de13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64aa708081c196d8b313a00a9e131bed140bd61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d056e7b7ec100079debdfe979b9f0568bb686d9f29b4c0f093d47b290d0f7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2616897af764a14b5f91c89b7e038596ff29de0d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f54be12db1bcfa7d69b00d2a5dc763cb39c7ff02d06aeecf5c2f121cc3059b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b46bec0c399520999b43fdfebec42cccfd9a382 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2cad61c31ffbf7fc621d8d0d9e028ec62696541a6b7aa7e6b00369bf84aff6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3205a4b9bf7459679b9de488e6592e0cf8e3a864 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5292c8b6c949723fbe45e54bb178b0154199bcdd2246e96769fc11a4facfa06b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e007ab0e11492298ae8073d65e8629065db0650 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dae46b3043e314ac2a9a00b8e5fac65975e52226141be74bd53505d7dc0cff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92b4c63c0a799aa75e3b37d4277a9ae6976cdfbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb5c5911467b5b553bac4ed50efaae2f1d97a220a56cf435de94d1066e89166 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd65da39585183a2eb61e32cc98c78c3ec35c21f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8678d7d0adef328a1d1c6b0cd0e93188671ff2dd3bd8aa39ea72b4b6aa273a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d05c4d1789e4e8187a738a70f50de458a7224c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8906bbf79d6ae66ad60c0b63f4251fcf596ececd2c60d44f3646c051d1d929 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab427044ca503228aa7a65b55cd3dabf96238bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3328bb96a4f0c5984a8c229a8d3d2a11fce35f5375cf84adf035c00d4be1684 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2498b0320e77d43d7aab40b8f93a8c40c30e75e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd3b3be327168b1daa6ebffe2dd3b2c6bb86f40e84a916d5e85c902c105bdb3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c407cac266ca0577da1c445031fa19847958a693 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7360a9ed2b18025b11101cd1f998edd634439890024ac0a8ab193b90342c0a6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b006f960a30303b647313de797781716c3d6868 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a920b8344914294db14498cd362d0e7c6ee8cd5b4659590615a87ea2efeb2ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5cf1813ad040eff72b1b6d4528b3a72f9bd170 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c5dc9e6fd69cad0c52a956f3fd56afa1dc538bdf6e111c86342f6ca50c3928 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..283021f27a8ef2a0339e8c15d03e18c17dac4666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b94b514e9d522324387387347cdc5211f7419678f8f18e9f58cc1431014772 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f092ba6d4c448f2260ca3ab4f4066774a1add32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1d36a6f8a5d36fd4ae147b4d1c33b1fdf793586afc7c7bb0ffbe7c20f0c7ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dbd6e03dd4dc1134cb94be88c14293ca27881fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887f4596a94d0a0a7569b9be33b63061baa8e9b2413522a56e4bfd8a5d0f480e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7eca82f5d34df253d69e054cb6fa490805723bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c37dfc330c0b54e1050d24dae4eccc6df22dce64f55c165f3a240599d58dcb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed3e0544934f768e8342650642b6581395daabaa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb34244d2bce131a8c0285a7af9310ac5e0cf8c94be5c8147fdfda4d93ee7af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e149a3e03087ba64c7c552540d7f839b2d471f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a5462e2b7a61a928b56b0eb0a555899fee122d51d9b31fa1a17d570e5a21ea4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eded5614c993f7b74769ed440e04ad55de5e7b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a8f9d8e537da700f6c18f501f573741df905d2505b4d4aafe6c4f013dbb63d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83fc15dcf7dad6d0007dccba3284e3ffe52b4555 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ead4615019abf06841167d1c5613d03807785a72d7e6df8de8dd77e75d4f5bf8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cb90c418cd21779bfab09b6ebc00ed550f6721f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c21d9a78bb84497b18ccf0f0f27991435ffcd91f34a1b0ce7487b33586b333d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a66563360185a907194cede7866fae750cec786f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2a7dd21bfa832bc0c05fa87da281204952f202771acf70906f341911d8add1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ca6b6c866752d2dc8898b0735af8251ff6af64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caed2ae762df2b8f2d85b3e2fcec226e8830694ffba07d3a69a16ee6c0fe5b07 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..840eeab05ff8880fa3c357a52e6ebd5bbf3a1c33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7d6d909a23e667485ef3588a3d17c0efe31479a6f1391d6ad972e598df6e2e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb3c50976ff983841e68a74b5c3951e7020af516 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177488326d752659f7162faa1f0f5cb55515451b9992c28e515a00915196dc4e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f16d4a310f64b3d280b62532a3e8976589d08d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f610acae1700c9f0711a5aa3a13dfcf626a19a6088189e3ca4c18b982bc670af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1bf9e845041a47039371dcdaf0009ba26e7b931 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bfc0f786f3843e06cea84e431592b2ad1fc65fdaadb0042585ed64e10a82d2e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28540aa84092313e9330f93ae2d87e7c67abf0fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2921580463891bd832771e60ab2e8485dfbb14b39d036676c3897aa936b865c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3765a530b87401fc226274da70da5dbdc91a9b84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46753dd2ebe18d287290514322993a93d69617bda0e95c0abf9495340aad0412 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0beddbcf7548da775b65813a4bea21ee0092c96 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eedefa0560c8eab20535eae10c317e243575b849cb45bfa3fc096264c499a204 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb9056c7d96e4ece3e50f81b84df8528e10c6c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e151eb5c319f929103b867bceda16edae4c820f77a6e839312ca3d51bf59426 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4005013f7fb8ef53cb11cd78c84dcfd8c36c6678 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5af756496eec7b287f79ce743258b849931d103d3dc2d491c05d9039456cbb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12afb24e9d3ffb36685e95a7c93270f9438c28e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c1839539889d380bef591cae82fedfed8839030b9772a6fd1b64b411332c94 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..938f8021c6c0b30ecfba6d537801eeb81e819cb3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40826e53bf13e1863cc402c19561a0d62948a23b5fdcbc81d883eb5295ccf37 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..217075f402c6a05aef0a891ef21010eac3476ddf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31171dcc15d155c86a73732f3eac660af6f809280b80669332b5f78d21101a2e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6893308882846d4d3c76e9cc17af60f58e19a0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d14d1f885c9c6c310cde7b1db58a55cc054395af234f0d507d274eb9240e925 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6822399e9ffbb174652efdd3c6c8e19b8786537 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a126817a0dcda3096f6c12ba0c928ecdd46f24a8042b1a68613c3edc93edd516 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ad7feacfcbab0c923f5f0488b6cb45df3224ec6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2fc9c603504a2755af027d0de4edb1a76f0dd3cc13a1a2dcd4ca8c377dcb654 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db07ec23ef3ac203deaf36b8023d1e6ddb726869 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1416c495d6b61347d7e642e8d8465d4e43ddde9db32529739fe7e35773d0b0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea638ba6b605ea52a63bd94a9bcf7fdfffb7997d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a330c25c962500134c7a738ddcd868f7fdb7d3d4a8341a6d4f7290f442a97dd1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c0140f4cd795828b693752f8375e98df285a13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c27a836797af86c54601e3b12fb991002c33d31195506433d0cefc17df339b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..247a10f8f4fd5980cd9b224ef04ef5e8398ed6a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65936e1d9b0b67c0abd4228e71c8f3d4bfa24d42e973936170c8d3649c035a82 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..671e9f0cffac5bb42b90e6e2bdb7d243fb51f3e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e23a8292b1a606a2107c2e203eff7598ad95b17ab4db3b38bad6fded9ca7c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fee12a7999b42b9b2712812ff5036f2d1ffeca3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734d8184599121428039fd2eeeea30aec4698670be2ec58f738289f4166df930 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44c0554b894259e1a63f79b581f74bb2e0e8482c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea495696bd3574aafb7122a0f0de36c8cf97ac0a0afbf94e737d6f22239efcc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45f4521f2013e23a21bd966d1cbf0397f7e3c51 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2321b99ba8cffb4f7586b5561e635117446df34555b7f02fd369e0ba972ed695 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22d38957fcc9c72387e069fff825b4f3e3c9473 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea8c30bc047f1b9215ddf4017dc6ef78d0dc9613fb995120d5fe82b95e96424 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47a4a1233848d943d07e23d490de510a06052d1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d7ebe8f3a63aae540b4ba7166a73cf0aa48620429e4e306945861b99c66934 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0783d9386d683175b73ac1453a291cb2f00bec70 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc23ca3934af566054253a1dca5d0e97768b94e419bae7bf5a68fe1aa4f8be6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b4f8326157aee1b44140f8313c9e53b4eb54270 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367c7630e13d74d9e7f4de285bb1d3a64c68006513d78000bafbdfb214e3fb39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b185a620f3b89b1552fecfc1beb6ce800b1da02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efca4a1df1eaa7274db62e72bf2b5317072d717bb377e356407b72777e142d57 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e0f3c3aaf6e731b839b0507d95978fe2874082 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a866207b6231a0281d4bd6b227472d7e01160576f0774300ccdbcd7e53d0b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88fc67175323dd1fb1e8ad75c7d1a40bae7d2187 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31846d231ecd29ee1236ef3fc93bb109414707b6043ea7b1fc69e450605bff19 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ba4d775110c64e22dc1a394057500432220c03 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b056403ebde5b7bab6430ad35c4f7d51be2694b28f12fcf04329cf297d73a91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ddac35648ce0aba3a3eaf884bb38792925a30f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06055cbc7fb0f936971972e240231e1af3f00c69c37c0399abef16a38f63c54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..678778dc7d100947115060690e5901e167e514b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c89d1760053f456a2e313e28b624a5cfefdc3840e6f35300967b1cc882355e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5afc3cf625b4caba4d927782737ab67ee51e933c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b9122fbcb52fce584d60e13d20f8c20982031ace71987ab03e1108471df710 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d0902e8bf8e5b3b642f4ec0d665220c0da527f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7839085788aa87e5ad712c79a4502a051076dd11256c0870cac8acb1b7479b0f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..486c4fa9d0d3dde665b7921891cfd707356c04ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8063c77ec44a36e8711adc344e16a6757d4a500c52ee6fd2a4fccfdc3010c1a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47bb85f9af6a8f64e641eced25df7d15f77abd56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418bb033c965da9af7998e3c50c9b48e74a4f30005a4babba696bd489016941c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff15b780dae147af0be1a84d17b6b7d393eee5f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dafba239792e7a9e4f3f5b987a848a30e41d286a1da499dceb4a55a554eec51 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39762d295cdbbb34b947b5aafdcaa28b1b61e84c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12721abb795aafe97d4a5d7519256041a92a86f5c10f99e81fe497d9f1b853d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa46a783cd2b90db34f2a2b96c669392c9a8c948 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c4c3923148b15c5f19f19e8d50992a95ae504895dfe54fee0d07af9c8a70b4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba7dadb660bf1057b3c5f9eb9a6ec9d90d9d6dcb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e056a016ebb27312701cb6fe0e5b21d1126cf18d291e2f0a2f3db084a20807 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ae46cd53bb9929baee05be469eaed18fa64a5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47be8bdff02ecc47f7f61e1f8de1fdf79bf1c1184d36f09744e2fa2ab73e6bac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c701a49c457708808c0345f85c81cd056f2763 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c430eb61f4e1b5ef41b4542c32dc5f4e32bf2a3f1294e17607cc400894c3239 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c24050e98fe7e0fa35c1fd8e26ae06649a0513ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1645e2f94e5c4aeb866f23e26d4935e04901b1c00d323406df4740e8770931c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42a39c7de4c9017de13dd163652e52c4191bbcd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1789372ec5f6af03040c68610bc239f7ae247b464e2f78b2ac1e7c0beb56bdad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07edfb3890fcfba3822d2337a946b33b9337f9ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb45de62d652f54ff1c403253412def48fc64fd07069bca9f0a656728642d04 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9e9455fa3673d270d4c40e46c3ee46ebfdad2b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d74329919955978d1dc1437e9111405d595b4f4600f18714c1c2b910dca3a67 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb75a55b8d0d7bcae8a2275bd375214523cca78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76702c448475ae92527257ad9c61b24f3d43841262c6079782b6a143677e6446 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4961c280eb6cfd21e47097c898dc0f98ac87681 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac448d8bdd6ce45e837cece031078c093d045dd57ff05e1eb002f91da2bd169 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5dcc31628ad33e097c99bab564587bb336122b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae342b09704aafd99a2c645b542446bbfb425ba1bc079a87e0a9236284b87e05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da9da9f31dbe4abe3f0ad7ff106544a2e659fee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2210652409a79ab5ee2ee246aeafea14847dba85b354be14eaf04e9dd5a97e6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bafeaae38bd46926ae47fbe0b247aed56ab2318f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ceeeaaaef47c4a59b91d0e4d9eba07c09113852e73dd33fbc6827b6d3068eea +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99d877bfceb83dc9303e884d720a56baa3aab98 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232dfaac87332c86035a91b73dff9ad71b8a2fbccdcf38c7a314e45545f4f875 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06027ce4eea66f1bb57b56a2d79b4e4cf39aed7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f36848b2a9f53b1943bd97e4a9c73ede0a14ba95df7466242671c6471e4dd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae82327daf39273570f8cb8cc749239be3628474 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e547644abd7471cb090789d544a6c7425c81b3cdc0c856c301e370f83a40046b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..522a6fde9bdeb9b551a1ddcc5772155e79659c19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1bb5d4b43836e73cc068c4aa86ee3b8736305d50346a1e7e1786450bf17c7eb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..217caac8739a0c0da38cd0de34cc440f5d0a72ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445f3f9d73c064936bd0cd55acba86bbb84db81d6a71d9d36f47c92b8f4e7bc2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf26646e78f554ab1b6c6f276324a2b87836100 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a77a13a766d2649746048a9d2a53e5cc4915b9cac502cfc739c70857a56b15 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c63b7d0a76c9dc67ae9137fec68d91ac430f7cef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e1ed92383a6ee86b125b4b880f9493d6660685fd38171304d9b19cc07a531d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4586ba900144d4ada7e77436c8785cde5be501e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de781fcae4dfafe69a0f2b16380a874c09db8bb9d13a7f9a98b87237f1c133c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..029b47dd402b7d2303e603e6c8601554ea6ab673 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54365d11c9d660b2d565770f6a9b0fb14a404ea7fa653ce7466da2fbafc4c66e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..343165431d793af68ac363f8959dfa4bf8890235 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:650444038d0125bc6c14d5b8f174b15bc4a69064daa75ac8b91cd300dbc55eee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5a0d57a2c25280a740f8d807fa0e852130a392 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b36622ea4ea1523c35f14b244747dbbf675c49309e157ea613105c8db54d369 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15cb35c39c556ea08acfa55a5b04a17af2177c8f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f81149e58e94035269465b18fde647993d0a414c419cc53bbd86cf209a028c8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cb36e82ee7048a53cfe2a316e1ab70ee8bdb042 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92ec1293186c55dead0cfefea35d01585c851b247f92f4abebbbb39e82937c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b20c2d17c1ce3da3a138a2d05a4115c30337be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56acdc601036a0db71e97e793f5477de60f7f5769a02dd116fcc5827e7145dce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a115e44cbe49ff0a7c9fe0a2d67bb7b994480b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6cb5c18e96e07f7a58c018d8801cc1a2f426d8b7c1364d02efea9bb47171ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9b7421ddb2c8e44b0f66b8fcef447a755d49cb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2336fede07f4b73dba9ff3b613d2ad6eeba2a5ff7fbc8b747bf9bd74bca309c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68cc8f2292226fe31fe35584189e1850917df256 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54171eb0151543b9291d221f95abf995c84cc06a092fc9b62adf190458bd7d32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c523732d6976900ec1fa0df8c4ae24b64c1d942 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56925242c784711be2a8b05762d0e7425c6e784c11a55287249c3b051bc1d941 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3eb5fd9451e705551a262816fd85b61b6f1138 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5663edd53077adeece12081be69b0da61e22c1181716817fd209c7c430854b0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45347263e7c175f969d14e24482011bf4b2ee5ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e596e265affcccf7123dd261ea8ec4431fbdd727b94782e7e7bb71d4aeeafc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..433467b649d89bca1b28619add5fdb1d1c2c16ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feedb824493805aae7a6a894308658d4d1b8d7bb57c29a4ec58aef012d6eb1e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c085d77a97642b8157c0da6ac30401fe8913e6f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f301ab225d01084a43e7c03bba0790fe2e8dd1c4e18bfea7b8560f07edd45f77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..020e3e56cfd5e12b679ad97b379054bf8c4f6fa9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb76c0aba9dd0ad64e3aa1d880aeb35d04fe35d8b172274da06dcadbf8d1ad27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..583ebdc0207812300083491c2ee5bab63da33e6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c5538e51a2ee867110c4371cae700d5c957faa6edd4449458c57b6c2c3560b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0b47dbd1c88bd347c7d4e3b0c88bf44b9f37de0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75e4ff93b5c2aee63dfb974b26697666e4fce554c7651357d618a5dc84f2d62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4079874801437d9efafb87c50eb6d1989a954657 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d17dd37c8bc4bc62582f7b823eede07cc7a7222667fc982e4a118c477c03871 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6342f6e4e8094fd0f1c9d5587f58f886414c7999 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deaec30b7892d0e810690dc791947508dfdc4407482f48a9512557d9628dab91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..593a4f0a7a710508d1be73f0f63b099aa0a0c56f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd81c3a4e4053b5d29a9987f9584575f8a21a293e1ec0118469b0756da6ef718 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7dde9b8f49b0a602b45faa1a306f4710d86d4e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:802a37a109b4e01f0a176654721c6889233f09438add005ec995fb4c405bd057 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cdcc929f893352820a7fe6a15100f10df5b9bfc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec78f10afd9e5e982d92c35e8bccfabfc88e50fef4066fa36ffb025f536bde8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..341233509d3bb5b294b86c0806fb290864de71f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b20c5e8a37bf3b6015e42137da21b1e4083e7cba254b4ea049d0efeec01a1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0917e625af96e6d0162ea89fed8e2f431fd4912b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6981f395c1fa05df7ccca53bd56a6a189b006c8fda32707364f7226301ec0350 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b4dc66cd80fe01f67cec26addd09bc08b916000 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56f23ec66c9d4d8d41ec597757a7528286c1c6349e112f1efedae570a2049d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60789769132f954d012800398c28e4135059dc8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3dce1fd6c902712a56464d541aef6db7f1afd634952997af178a26666de9eb6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e730d2bbbdf23297671dfb5cce630c290c277030 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15addc032df8d7003c56307f24dbaaf18b959e1f75b5c85f0cb4645d47ff72d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e50841946f6e03790ef32a3c9099ae486f714b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3fa578036355e0bb40d1ccd3f8084d97c365f93fadf3e91cce89b6579b5cde +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df8e2ec5756f80116d8576559b49b97d42a7959 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c3d7cfc09cc87be9079148833831a074a6ed1e673f4a320eb8ccc5ae74e8f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8e78c5a0eca6bc5bd825a315f73a8d644b7332 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9af7964fcf869df015452914c2809f9c21b36375baacdc3ef97d58ef327a83 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d24f4be9bbf956541f7ef92c72674e827eb3fab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e048d990eef1343917e64fee5858b3d0e8998ca27b3058e110e46503f1b8c77d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e023593ad7d6d426e87457e1a7ed220aa9c021f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c44020a816c9d32d0af346e7c4364c4321a4f1712ed718fd50120bdb33a92c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8826b6035d13c4345500b070fb8586c87bcd6ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241db0e30dea6ead2bcee02021e3612b73a85802e769ecd56313b2634147d69e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe6b0e62d6cbd50a26c1c271cb65adae4799fdf3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1872ed693bd349f7250cac18791cebfaeb5f6941eb36d5e1ca1db4257838ddd0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f97edc5e5ddf07720b4cc5fdeb6405ff2fcee0c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c655aa91e6ec475f85f83e67e743a907ada6ea0ef6f0e937fce279b49f5dc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b1ce916192e31e28453781510dc73791a8b8bf4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970ff2cffd69ede8dac94d087d3575021d70e97b8c390ab2b0e2c3336f01962e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80ca2af74df09e1b252f73ba4a603ca983bc7a6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618a00a4ca325b9cf9702d55c9f45c9502aa86156ff7d2fd5a1179ea9fca241e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..991cc4b23d9bea48d04b55b1035e321dc44c3d78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c849945ce445df8910702506d232150c2803435e974e7afabad4e8dc324982 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1883aaf0ddc61b91af71dee7af92a36c7cca0bbb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6134e8032d43b23dab5694602ab2940f40929159b50c2d00e7f91f4f34ee0f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0664ebc6dbd451253d32c03231c9e5cbfc207dfc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42860737f6e9a138ce46602c0fd0d038b3390f3053d2aecc6c24da08872e02a +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e331cc55d65de4cf5cb64b4327b6aeed9ac9b9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0762fdc8c9c41cbdb38513499c42b0f778c2cf7ae3d546dfc8349600a71cb14f +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fea41a67da9a22b063bc03bc20c94a970356482 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11041752ebf612310fc7e507efeac49466380ebbd374911f26ee7cd6be82820 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..373cf0ad4de4b9ccdbbc4062311d2e772729f94e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b9dfaac7c2a6be876a0b95e2688f63534d9693b1a9ddbdad830c40ac392261a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3ff7a630bddef62f425dc1cb6a7cd409eabac6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bec6f273c563b9ab8adbb5441efdc3974013a559385bd9875b48ff688caa213 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8caf13d8ef3da8f010c736d3825bf20f5203358 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00adc3f803c2bbd3192b25547141c06c889792fff79b55d30b7810c233db2551 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d835d3fd60d9d414762aabb26cb40d6c54fb3e1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a85a69dc9987c28f0e1621e69a908234983bb913ffe26f71e219da43c804e7c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b63c80d90bf3ac6dbb8c2e081d0faa1a5ccc99 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7974c804bf6ee6473fe43870b00ed0a1a5d73b3b2aebd089daaf1a451c04d15 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c870a0133fb466171e3b996cd3a24b71602480ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91ab08c76477db259324b5a186064cfedcf39d971e125519e2018e719c160d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52519fa64bcf855e2ea17b5fb9716cbf5b1b296d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83fcf20ff01f1e038315d35650ff2edea6ef186aff35039e9a946e850bab6478 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2092b49f9dc0d8e4a81ff5d081c4932a2d299eea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3188b5832e87ea14ddba920d8bccb1a023a81e7a58e387a83cc3cc64c1e9ccf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c44e1cb0a7000ec5c8dbaef19be82771fa1a72 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5916760548da5b3a03148d2c94094c28851210a3387fcb3d247cfd726d05ee6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee76c60e01dfb26606a647ddfe470fe760c2754 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a9117c95a9355e95403b4158dbb18665360bbb6a39c961b4824c0d30d4887d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcaabb8703e11ad673e9fe9ed45ed1005c1d89c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a1a9b63eed35ee5ec08d63e3f622f907655fa63c1bd08b8dbdbab233f33e48 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..49cb1251adf57d1e30fa12bf31e4b821e695a59a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8251b3e25f17f2d7701f4e1528785b47866817c378c759b9863c7a1ae28465a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebddfa8c6071a8a72f5aa8d5d23e8980259d57dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3295cf7041ad92772f4c231c75dbb66d7ba3b525c2b82e1aea32d796d533ccd1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ddd7983465fec00ede31796632d2185e44da94c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66252d64a0d5fa9097f6bd01fa81c4893bd7cdfe0186d12aee3526453666f4d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8f65f9a1318c59df9a594025bc960b3a9fc04d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06967bd072c0a743c36d977480f5ba6635cb16cc49019580b73b053a5bbf840a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..baecf8b34a359e49495c0c65d1788ae53947d390 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c9eb4c0ff48fd707287f2691389fa744842995e499b8ca2c952107fadd862d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac04b902a5ce73355440da2218587b60e5775724 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cda3d81c547352ef6d1b7195f8fbf015b68a5848cb035e84798b3b6f4c24009 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27d1a2e563beead20a4d95540a405a6127dbf43 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04e2fb611e4189024e63dd83f2e73e9af4ea0d97e90dceac7c3472d83819b611 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3919259480ca0bc564fb44331fb8d166e3bd79be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f0ee0da293e9f972113630939951fb37a3a183b39416e83e89efc982d20f16 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37c4347667bd6af5e70841cd4f82c1a01a74a668 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e97395f579537fbceb87a6b4ef10d2874d049e130b603cc0387454a526ae73 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca6e2b55ecf84cea0e41923143b8345ecc5c083e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5731cf0ab1a0d391d1766b049cb298a0234bc38588ade21f03c09ddeeddfd91b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfeadc96eb7a3faad045bd8a9af19137300159f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b160ca7488b9eb9950096f63324a2fc356a1379ddc8949553b66c25ac2712716 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa40e764c1fa17dcb2511c92677465baefb2ec9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7165e3e5727c0cc7116ccee7c89ba440a85c2843123cf0dfac8b3339c89cc92 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f3252fd9753f458a57ce0ec414ca82f4b8be15d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20e1cf50da01649f8ef9375b0e17560fc3143bf4095472aacca20776fc12b4d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef10947c14e9ef7a8159034c2fa6cd237b378ddd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954a30df350e00af4268a73a4b704f970c2deacd6c1c328b6d0919e1a86cff95 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7016beacc9fcf4137ef5c8396ff2a86c9c4bf52b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800e514a76acde082e971dba8eaff7272eb94dd2e4d0ee47ce52bb5eceb1bafb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0816aa15ac3853a2933a3d0114cf2402a6581eb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2efbe5ccbd47ff328ae1ca4da4e5c58d9b29fd36e389076c24bc50c6b9b7a252 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1a9164989ef9085387f4897c9be5b15f688acf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65d8304bb09c1a9fbd308ac2593770a21ef6fc4f31538ab470a743fe0a3372e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..632e2029a583d8cd613ce61163353990239c92ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa355c9715a00274f9d28622c15c8dd4266e17611699c307a16b2c2699ea63b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2483c888fd95a0ca3b4d9a5f645510d996d1ab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad791fe95810f03bdc078d23f123673bc87207051e4ddefc52a30b30530c8beb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c281e4dcee399df8d83165374cd202dd1cf1db9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac20340524beb39fcfc011b8eda33f282b135305278e8ac1c69b152854a7683d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8b46009a954af0329fa376eb637c5f4ebf07b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ea3287f71e607bb6464b4023216a1a03b36a6c2b54ef7ee453b046a99d4f19 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a20747502dfd36ea4ea3619fd5d37424b063662d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b873c968de1832c96381454b579cbe4e79067adde154d7770597507a683eec44 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2165175298aec66cd61b79c74ce7d66c17c3f40 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d0fed487f88a2b8710de0913e806bcad86ef1614a112da96c28192bb88d130 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..970cdc83bea212cf3969c73476544fd8efa27afc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d558c978d6226849127fba80a2d93c240011bcf765c3c8082a367f1e268328 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be143e1b1a83fcff98630afb0edceb05a8271683 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87072cbbae0d4022b5a69f1e6ccbc3dec9da3ef761e732b021106a46c226d9d0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5980d8c7a842c405f2b8d4cda7b426583d1eebd4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4d9c5f5f8965bb6cd18e186933cd8f637df65bbcaa1d5b33515ba21effd285 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa04fcb30ea319f608f02a12b2efeb5ce194754 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32758e011b044c7b6deb4253ea48ebd0eee43f73f83dc7bdb1ae21eb40fd3088 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f62169373ddab76e115d1ad9ff27d95ae8f71a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9884d135c578cea36b270486662914077fa12dda87d45f971ac766481daa175 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77819f4a83673b83c6ba01722c68bd7d9ac38058 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bcd2835b885222726fff2bf2da5cf270f0ced52ce1dcd5e8113f339db96740e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb1623f7de4618e1cbfeda048ba45040e282f30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070a75e6c97de1fa4ff2e448e3cc05e10189952bb1b9f519e273d5d784fe021d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..639797a691e438d911cf0c05326c14eb529a4108 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5cbcee08e902ab71a0a8f0fea71a5c0a5691f6030fba5bcb475996b4a3a0a59 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79a138f21bea97f0f7aa74aa67df86c63e89080 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4846edc8cda862b777af990e3c90ee39c9783be534be6b5b9be688a7573a04a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b26b1684ac2a6c493496921461d47dd4faedd623 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edbcb044ea014e431365114930a38bc45b3cce6675a71138ddf3278048a0013f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14047a70ee1ad8d3bc0f7e735bf2b9103675aa5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db397fdf256afecd406a564b282d43d3377680333ae42bb9a4eff1234587d6f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6a2d4c2d6b4acd9483b738c9f2792ced5d2e78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4beb3c75a4648695ec0c39c3dae2aea86c1535502024670f403918e7bd79f6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3f66322de5ff57177bea830c47f340de23ac2e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765be12dbec64a4854a7f94a39e57a19d144616027b35a36183218a394230b77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5015ccf07e8700f791e9f4746afdf064cc59cfa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ad8004f29336e570d012734cf0159d03dd5ab6a3dd9d9621970c1a87a14ab2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d25d675f619ca0f70758789556a0416e5339f1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f02059923eead6b0242e70e7d4e2cba978c0c3cc5f9e3b6ccaa1b165bf7baf +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7996dec931eed87aac8e1f3689bf24f83c21dab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caea217f83fc84af59aee1ddf64c1c7240ab8b7827b39e1103e702cee7d32982 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cd9d7a83f81befa0fb054ee673b647c6121357 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834ba5ee3e33e714c4e483ede55ca6d8056746ff1648e6d1a1c3c74f45f9305e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4f27fe4984d0d5fcd184376806dcabb1f831bac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eed2207bd3c37e5e0e5266c9122588fcd59c550983cc2e928ac2e96e7205c3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..332a075fb8dda979a7aa47f0826d0a5251271a22 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4223d60faa54e4a1df8d6a2124f793ef08e5bf5e895ea1c531fe7be326758636 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4679ef3f8130f111a7bb445878d4ef4c7731d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329d4759efb6b9104b58c97514571e50259789102b81e73c99e111b5ee48d3f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2005c2c38c355417b6bb1c71a371415aa115c31c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94321f2e0ec11535f1dcc9ac974bdec91a1b1238de36eb2514331b1592fdc40 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..212b9e4aff1f4f6188d19c1d20f0e1e59c730cc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629fa12f321b3d1e120aa81ed1d7e3171415b097a75ce28311eeed6a0483a515 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0833fbda50886860bbb26b66a71713afef3c07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b33e8e5ec31b68e95b5c83a5a1608c25ee81450ff2185e0532302f8abb3b505 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..070abab022a8eb8d972a44ce07437485ee938d09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f072f74f639340318cf667b199750545bdd52bf50051a615cc0339259de4b798 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..888e1fc073e223f4279ca2396a2ad24485532a18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b259f98affab95a071c5cd4790d6f00f3b4aff1d585bb36679e109160080e5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0414232a51b663fe776aea8e6fbe1a9d5ea6b8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4e1bc59a517f69ae8d58e7dc54a62b1fe9a09bc3c69964acf16f326f665a33 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13136a75263ac6990f5f3105d21f434ab79a364d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab41af762bbd7df71cf36eefdae2d666d745e3078e5196bb5cbd0f2af4fab18 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6a5bcca2ff300b176dc5d52def38627aced07d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ffdfaa9af6bfc1c11a58cb88cffc01f854ec81090a01c68a40e49d36d77689 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa41ab5fd0921379a62cb21dd30059ae9db128c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f7bbf8ca4400c921ccb924d83c67cb3ff8d8f3241bda627ac21fdd2e6c61e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df8cb481f0be6b64700f20c1c79012ea401a3e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e504c9c27e22b5e4b18dc7919d6637fd9b8dd7e9b99ed39d53b7fc01b3db4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ed6fa2342512a3d33acfbf0408038054dcd9fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8f9cf8176f772dff8440636c05f789e365527f3eca3cc2c603f22ee4cc6a5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0236a38e3b51134c86adab2e7d871974a14c4cbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67237c066119c8941146c817f3033c7e368237ff53daaa6d3e97e4005e8e9048 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c83fb25f8a06686660a543a256e98ddb7a0e5f1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b2d6f7d053a7ceef972d3ecc2a44f0a94ca1107a9950f2f744721c0e4c9de5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0943c3f179fdcd4bf2f6afab8569a1b739e2807 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e19de01bb9f85eb69cd648a53be7215dd00fd99334d6d030597d51e799c03c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9330e1dea1585b0e9e42507a73f4b06ca97b2713 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd30bdb4d82f6306d2a17747b0fcabebed853779c8944bc4ab455f64aeb552f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e2b0cbf5d3318bfd434a10b11735c0be47910d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf2650f57c46a30c278995196d582fbc480586b170bfed99dcf505b48167c29 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5ed7bfeb723943da8d1791e55c9365b59fde9df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fc5d54a4850f5c3d1e725f47ddde0267f0223022469ba659733ad01557e9b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32c7fc2e7d8f25d6c788832b3621befa15c121b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ee1896d69eb67f5ff9fff0db354b2439f3470951429ef0b9a677e08b7b62633 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e9c41fa68a086ff452f3334545d311882b80fc7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56cdacbcd5f821ecd5571baf79f70cd638aa154045eaad3df9ec74218022d4d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56104e8d555780b648c5f6bb87f5a2e9f0322ad1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310654594e997dc4edf4ddc4bd1d9799341182c48783675e5124c7fc9db11b48 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86db1cdfce34e2b85ec53871687444d41b2db087 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c07b3a0edd8fa8d2c26cfec6be96638fc87bfa1e605137f5600968e333b03cf7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c82eb57e5c7d7bbcc5479ae059d2e8a46971fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e499e0f0394e9dc4d5a3ecbb1ba1f3c0cd8220132a3b1b0c6bb8aefe3f2d0e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..008e89e8ec9b59e403a3f6dd3d90ecde61aa5c68 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca95c73cc6d8b1f904f7792d9482d1c898a329438c6739aa8f926593ae308ce5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4f9dc60e342be8362366d9483f8af2ac754c15 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea2c2cd7df3f96cd10f91ee827b5660f87fcc1b0cc7d38f36b8345d080e28dd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..352833c59541eee0386cc8ba8ce71a4090a2cb43 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6f46f8b76d8a835bf292f76f5a439c579993cafdf91ae35b8ec767c3b8c03c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d3790479406fd967c6d1401ea3b301fb59ca45d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d2afdf9284076c07124308e966abc040b61995f9084b4a6ca6df37adf2d27d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc2bd42708b77353dc10bbda56287c261536253 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ffcfb2d785798e43dec1281bef87cb01a294e1df5b15b31fa4003165be4c7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..776afc9650f69df754f28bf0d098836420313b3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2665b38d58b36eea522815db9b70950d3b012f2fc4575aabb61b6542c9821d36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec3af9c37d976636e7f9d20104fda3aa734c9f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ae0d9d9d02f8b4195c30409005e41f6c671da683ab241300ecdd9f293d1590 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c21a7eefe40c2f66fbe887090288909cdeb7ff0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07888836bef527510227fde11c9ad231a6d7613b6f98a9d9a4923e8a4b533061 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0d7fedd0582290f8d2aa2b7c968a21252141d1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a026f99a6f195fc6f96e6d32d2d4a634289725515606b6cb54b073c789cd6b7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5802e22b06f1ae09a24d7a0158f1e8a978b39d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98af581bbc280b13e9be7f7f0401963d909f1b76d1fbbabf92ddc710ed244269 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..598d6c353a7b48f7f378f096a6fa132db0e938e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556a68b90bff02d2a2cd3951a99ff9496b9f4f2b83362abdde0c014382553349 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e91e9c6758484a98d2154f029f638862b1b8ba62 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee5f1f3175cdf672d4a911ab78f90e89588e70858a2bacaa3769a1bbe6686b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d719de40b616672e7061c96e29050b59f579edd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8595ce6bbcbd407052dde491ba336f7509e572660b9038ec046024f30198397 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a4b0129bf6509fc3eebed9b609ad46c1671fe76 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3f76ece601837a22cb5176f660fd8a4a56af9709691b30b3a108a8ef17a68c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe6cbd13b95dfb3c10ae7594e51e3f1db0bd53d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac26b2291cd7736ca32321730c0cba52bad72e93c109218e5749f5fa9f00fcbb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae033edccd9e21a16373426cb7183ea3692e0c1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308e3746bf0724ba6bed7a213f74bb2e8b2fcb3759fa52bd050bd95fd9720d9a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55b9db259d5e4f20b8f5b596cbfbc94bdf4133a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36e661f5c1162abac08a62a0412802b276a98f930a3e7601962ae692bfb3bae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a21895b194b71da8a0676dce7be8d4bf9658dbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef88a6eaf72038debf77f32d358c2d6e5c2e43ae4fe89f22c8d021331220a3a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff03d118405cf7a65eb99151cd84763fd66c599 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f47870e3c5e4924ac22d102b68b105898c032aabd702f2040842e85acf8bf57a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de67f46657e0ae226fd41bc000b8228d15cd57fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c53b08d3a0ebb13adabd0ffcd5818277d578b8967a0af9415862dc489d84fea6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb28ebee8c59e8dc0829047575621d534751d39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda47d28d2d09291fcb545b9733cfd70e4e7fd945bb64fdf5dc822120307d3e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24266ff0efe5dba3f8162ca438c496f9359fc737 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58fd1c22c6eb6be12fc80ec252655541b16f8e8244466a9a9266a7ab135ac2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cefbd582911dbab6fcddabc23dd9aef265ca697 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4eeb534d810a8d12d796963a348bfa306f732bb5f3847aa8cea26c8dc0292a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..58bfb1d8d6f734b2e4f46879818706fc07bff5c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa48f4c2a0d31ff4ffb2a07be7ea22885769a2500637a2fb745932c40566420 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..214c1364a951a6de6339c1ee13c18233f8e65091 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4aad723ac1ec4a70cb02d419e9b95dc7f5197c20c57d025ed43f75aa67a186 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..860804577cb8103121e3d4288a5adba9cb0035c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23586371378df474ddeec5cd6e691082aba774af2297e461177b155f67e64e46 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0999424432a3f73032b49dc7f0d1adc1d1408d53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0e481b4b337198f076693ec1b4d719be689eba3ca510bf020fabcf42728d09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cbfaba9b923d7ba027f444413024e5d30abe327 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447c63d05785ebc4728c28fb103b01059919e9f98de710669ca845d22eb7266f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..580abb3008a66830b3b735f916529c4269c7dfc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317708c0b93be0cd2087656a4081465f2dcce034fe1990500211827e1c68416b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca308e9c7aa5f324d60e50b2e187823694b84d73 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a1014fe45789cf33354856dac78e326b5f88b78f6e8d21fc0d877d419c0c55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6553e987e9c39a6bbe91631b7cc40002d79cf75 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7dd292d3d8bea96b798825791d3a20b6a55a9dec5340fb5e6bdb5487346617 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bcc0b7e7b0213978e89fca495215e5d8ef7a243 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1f68adf634fb3e6c7242337fc10a9ca8ea57e9e35f7c9b1a4bcdda55a80a1e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..857d82ffb5b29dc70c7a378784451f18ba286671 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19fb76c4a3a82d421edd4591c511a62de0b6f1cba8ca11a5a90a04a27f4fa75 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..891be434e896cfe1cc615f2a6fc44b772d771cf2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5b0481e3d7019cff157729dfdd01e4a3dc247f08fc9a05f2040ec1b22eda1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad7f4f2b815020345083982e460386d8213f7639 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacfa4ef031e963cb5a3f978ee7c32ff030c0e7b94b0fee5f527da71696b9684 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f30aca608af54456656e7c7827d9497529841217 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8549c2bd3eec1e3a0f563521fac530f2d6df9a4b544e6ec8a0c13bb3f5fd6d0f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02474b24a6cc45ad4480445e6ff9e38f9835863 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fcefe55df129c040b65ab89a36e82a6e674c281fb35cfaf02ef091cf55ad836 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4927e195f97d3f13721e67c2638338d7b88ba807 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ee40d11501a98eeddd3357842a7f35ce19530dd29bd4352fe9ab7c99388073 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2565005270a3274d3f98427fb69728b560e5ef5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e044c3de26e4d776d4f3fb98f409ccd73ddfc853dfdcfae16324f192cf8d710b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a116d6a300c8ff9b396c4b30e0213830857dae7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3a1a321e158b4522ec9ae04d9230a97742d55fba25a4465cb85cc3417c6aac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0634afc8691682385763be870fe84c113ea81b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90105988d34c022bca5a386dcee7f66795d90dd58bdaab04c46cbba9483eded +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..837c59b834ea24d3afb3afa18c216afdf1fc3abc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340ac0be669789c8138ca62b49dcbb146ed8ebdbd4d19af24c570db92150dab9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2551e6b05dec2272cd828a0f6477ea79da46184 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4a4adaf8718b6ccb72bfc9ac08260d51589645534c0261594dbf711ab842672 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e22972bb7725e2a00a48309c2ebb17efda5d1f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34825709ca4d7aeafd2c74452c94a30018f2dbd58400f7b1a451884c73c69cb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f358371a64859a054916c8af860058527101d3fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239d35f09cc37c169e5a4f51139ced65622ec878912bbea4f114e34a929a43e1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6275122c996c5aa22a491999ad83e110961b5f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908937402025847cd44e7ff38b6b27635b71b04ba82d6ec711f1c0432aac0c7c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cc53196cd0b77e591acf45a36c886ce12738efb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b9274e53c033c8adaced0ad5d03358f1a9dd775e5539fe02bc80cc351f046c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a26b441b90a7f7e5dcf50da8a3a447e756e23d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c95751a298e182c893a565ab9f31c15bad5f5ed4a4762434f9043462f3193fa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b95487da77642ad75638e408cb0e71ebaef1d6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39650360d279e7945953a0c65fab7159b5caf190d7a25d340abb82988d504f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5319966718927bcbfaa605495e54c07f593070c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2428f292cf421d8ee5aaf366080456bd77d36950c9ba92867d3a9f1f5a4f3f07 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa69d9208ae5e8d663e72fabb900fbd7a02e7ca7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe6bcfc2ef406b2a6158577453315c22da6a6d43d7e30c666b11e015831f459 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8254707efbb2fae6521c441080a91fbc5001756b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d40176435697f987459ebb7730ebbdafc03f7c0c9607263fa1cb5c3ed95adc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8a5144beab6f5c576ba025eaadafd09c4a296a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78d6afa21a90de521a974993c232789dfb07df71f020e6e06b81743955f66ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3014c6d10047a70e9496e2a51e5680ef0b6bf52f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03aa42afa7047e227d9d4dccd0370d68d1c122424918f73d06b06baea9e7145 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed80446494284ff43ec3e5bdc514119ec32c324e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e728dadd9797bf168d1e0208f1f660c89f0fa5cdc63e0afd165e6bf29de793e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6e2d755f6269643800d826aa7dd8f62f759eb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e622e1f44affa3ddb3937fabaed73fecb35e90a08542d170f321ecfc58c1001c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3031f7b83447f65ec90e360bc457a560d12783b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1735605c42ffedf1f991a456f508eba08f98f62b75c870ba7c0af307c22d3d52 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edf9420e130529ca9d9fe1a293ef0595d8d92985 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a08ecbbaa6696bc17cb414c8220405562cfc43aa3406cbeff177e4d69710adc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07668083c6ad94144e99acfa7e864711d99947f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f498e8b8527aa6e941ba589b67b89890fa70f97429728123f165204d16b731 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cedb3d194bcec68321d8d30efc2469a917eedcf1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b76b6e61a3a96ecc9267d56b2d942d3e560a6cd2041c075a1e62ddda41a85ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9d8fa602a8dec9ce89776ebec79cbe577eb3a3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d822f4b2d468dc39dd15bcd2e51fc897b01f46579323e1fadbe45db8984039 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb66838213b04acb7583f55ccbdcc4f30fa5dbea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a3f8d226edfc653a0f93a696bfddb0527074c61240612460a5638ac181c443 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c507781cbf98bfca9b982cf14444a50fb0507f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0fe24be775e8ae6eb3d6c46057d809f30943fe72717c1ab1ba0f5eba44a532 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf9b88e08e5c6e11da3ecd5fb95d8d5eabfdb03 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815e87780a90969e4d85245293cead6dcfb2d2352ff0bbdedb08d3eb62d3e446 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4bc8fe927c1673b6597bfa92b528e5ba7f9edd9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:365af91779396bf2cfad7ad65e19a398f12d5358716a4f6a132dd69fa85060b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..716ba33f6b9b592cf2257cfe4b736533e941e2b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5953b7f14df1bd8e25aa57e0ac15bbfb1fc2f93bdd48e7a45996a368652165e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d9c50c57201d01d2d8c51fbad686f49ea3713a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f8472ccb5f9fd0d692f4ab7014b0b0699705041296aeeb6dec442474bc5d61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab06a3a822352e95077d57e5eb00d8ed873af13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87918b1d75fb2ba1a44573392bd5d04777cf54dfcf47122f0365380321ec68cb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81d2bca2065dabcf4f309dc9992f9eb27f23e397 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cdd9ee6fb0e613788c00845e7a23cfe81ffc007d43dbf974f53ab42713bfbef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d945a17d7ab7a5560a209a294e16891de4be13a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f80e9703a0959c8400cb312b29e74f59d86c760d5435c1502702bb2755b226 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b7204e17ee8df1bce902202dc87afdafa362fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b505a739353d352eb7a0a0de14736ea0f6aca8068fcf472427cb7c37fcaa170c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d502e8c670bd722c660fa67c5b0adf54cd362d09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb590079326d73429d3abf58bfdc9af4af3918074b5c8f98fc9db8885afc21ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1064aa9a4af18f6a833f73f99a0b747fffdce23c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f33c40c1aba0b28ac37804a3ddfcf4435ba971b4f249024bd8885cd104e3e78 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6f7d2f3b4a6f4625cb5abdd319404aa7904fb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad7890a7380e3d85abd69f1da71328bcaf3c9507671b5874e05fdddb8da57aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fb985eea67d48cabe0e7745fe71829a1a2217a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af01f08cf6a2a92c29e14eb96bc6454ad74fc51ed98b19b0dae08af941cf8f33 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a73c4d21379bcb5b17f5da0b776259697069d396 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abd1863d9fc0db8ecd7cdb86a34728335a4126e61caf980465fb8179a9e4a39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3e056089b3d56503604dcd59ace29eb6a58ab5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050052db3e39dda1d6c748fa81056315dc799eec866b59bf9467fc2bd713b981 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efde1bd2bf15b0df15175f5608598596e462c620 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492d217e462022741dabbcc7b6d34e9592bc45fe5906068aee35c21a266b3354 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d8ad108c916576ea08c922f9f8bdc97c0997e7b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa68e0839f4eecc5b0f0ac5a4a444119b9df3b110ebe49f726a513b53a61057 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c316f8ff0198c51221703609134862c0adde9443 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2557e0a0387d47491b14fba7386eeb88a820818789a21b478ef7fbc9c1c6b117 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6cd8450281cc4c5fb8dab719c4c4628735e0df4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed85d53b6aa7441774e21163c042dedf23e36c93b8c1553aa2c44b024610633 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e20be6fee3822e0be256fde7cfc4bd794b5a6ff8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2476bf66c81ef25c3dcb89ec369cac7028483c86bbb1ae7b6198bea06271b442 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a5bff77fa53f9ab9e30fe56a2e97be1e3f8493 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff15f926ab0d607c3cb4731314aa490445b77e7f225c216f621465eb0fb73d53 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64fdfa8a3bb714164ed6da5ff4dec1944b690bf1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b5cd9a1527fe8b04e965e7cebd5345b4513a1f966b36c325bae5a0e44576a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f1e45d43091acffa19eb57647f1ea96f5b65c94 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e215d48ec721487b8f36ddbb8c23f150a37704c24d929c27f59d9541e8c9a444 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..859b7ba64190c4551ea97029996f75f141efe5d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3a157dee6d842ee7972268aebbe7fc182eec51428fec8392f064b039f17707 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1169757ad2448eb534f44c6bec5e0c72ed10537 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06d8bef392d1f7fc5a381ea4be69c1d27506fc841bd25b3c290de996d1dab34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59956eb66616d492ef88466770a1ef006b0d279e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5825b325fa20f1cbaec81c9ebaa465c7766ade9c0236e4a258d96ad582f02651 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91398e44e420c8d2e5d317682f4d7202369eaa73 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409b3a8c7d92dbf718cce1d3351bde0c2c51bbcd170b50020dc247036d1b4f7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6060114a264b52b9d72430b7c21f3b814f9550d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a53493ab79f58ad7ee400906b7b24e3ad4cf2fccc2a65f6b904bc7c1a3c53c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db622d766d58c55cc56161016cb73a959fd2a1c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0d8c14ba96437b1b1a96cc9a1fa7f3989b88bd18256bb1c115b7a3d0c5b42a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d7cd93ed68528eb54f790ca33626892d280e5c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a6555a7b60976a7b4d56ee9d68b933a7571f0370c496a52eceba29e20f4b3d7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c664c161420ae1441fd1cb6ac6310f13a9ac7276 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ebc17bf7d297f39eefb9e0e7ec2be154ee736fc89cdf0ee08576e1a1af82f2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc951669e24572f121a42eb3d4d8c58882d3966 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8b57d764c2e0475d1d1829ba1682a76627516f95bba7a21ef3eea411b7e35d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..600b194036b1ae4e047cf0a367ec7b831836d756 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c1498242c3174913a5c561aa1a7814db32b1797243719a45415c7ec75e7087 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ad6eee2c5cf6f0350142362b22547f8ecc8321 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d53ab3639d38af6bcebc253695de9783efead9e691f6a9abfedd2da9af27131 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8cdd0b10e5ab9c6c98549140e004ce1f5e3e6ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372307d73728acabecf76d539020ffd689e7166c8a7a413da29cd649f2071e6c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a92a9e08bf5f74b9ca5018a80663d20ea588ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0b253cb0607cb491b77b6f1662dfca087d64f527b4141d0696fa84bcae5b22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c32bb187f578f481040cfd60974d314cd85d8dcb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21cd2d21703d617f620597014d0fb6158cc610b1fb73d95bfd6196290e17b262 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc945ad2eaf68bceaeb9aede1bcf35a245f70be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03add787173428b19db42f74c6be1a69473491028d1668a65ee4b1fac6aafdbe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7357298bea480b1afe373d455bf0bbf5ea969df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e347fcc3931faf99f5c5d17b925e7e9dfa10ae476505096366208df4104ed20 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91fc390987115c50ea0522c5dba87cf3eeacf65a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef800b57a31f4e8149b2117e4e754abc5fabde63e3db3c940b4e6393bb3d64bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1a933f58cc913a4561c7e93cad89242dcb887b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24e969aa503339847bf978e20656ca6d71f7a128d7d994bbd18598ec352b6cd7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff38a14a68d743038eda69062168cf1b9fc0e7e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7130df2406aa163279c6810d24a182f4942f19ab97e171d73afcd72df09cb0dd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6658f2ae64822e66ee3b46ef3ab4ca517f1170b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2027555508501fe52873369e1fca2f55642e60b33757dac3aa919ec2ecbf877c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb14b8436c4bcd74f6098a821f64d38315f194e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ad9ff0ae57ca7d0a42754214f9cd050a7fe4391c1d68d75fe2b22150923dfc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d56f7e8b5db92c607e2a1ca1151ef7314f95926 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fefdfe5264420069f4717837d8e82984fde292f03d488f65374e5a4755ba078b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5548a4ab0ea7ed18cb8eca0a45a6b8d22195120 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538cf0ac20e8e4f9071579fedd72770a8280c20e1c65bdb8a461822ba6c967a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8068ad2d81d547c7d847b465a6d225c5f7fd4b6d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c08a592b07cb1a8ebd4d50a68d83eeb1f774b13085e32e1eba1009a24679a1e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3bbeb2f543a803ab2296bb5bf9b3efa13e045c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7787056d70969a752eda6384e176dc31bb18078868a9e9804787005ba9cab0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bccdf6daee32a87359b1d9d6a4fd24b89daf7131 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf8017cd0ae555a5b05a3b896c5915db46908492c0e6204825ad2e4793161add +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2f48d3185b02eb3318113b7425a5fbf3974a7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2c9e8bb0f8c5154f121ed2b62fab1375cf7d0f9b13facdc9d0e3cfad820ceb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63f2f3327ae09514f010ba440ff6fe543b0dc599 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd3dbfee3590e3853d5b87510d929315b4d387a39b01c3ec9375af647059f55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9576daa7b47ba7262549eff01b7803405ecb65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f1099e898de69248972dc89059f5482da736a5da6460780f72b5857cbe013b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7298ef4111180ea9e831f072159a1d057b392e9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03a75c02a629c960026401b2eb55ad1f5bd02848e09d2a529aafc8dc8fadeaa7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a6acf624959362db604717ef5ed0b8554b0879 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc2d85bc4786271414b6cd446cdb4e00fd8cd1ec1bbe649c0cf4f360520dfe1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d2b24a6dc891fe4276aef6838eee348bc0011a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:606628742e6ce085b553ea58523411c25ef44ade52f521a5c333210acb7facfc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa1d28c1b01b5823d9df561640983613f90fbeba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef713a720c3459fedbaeb917d577f483607a40fc08833208a463f51677952a3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ec8616e8418486baedbec275f91f8c8451cd55 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0224e61e7922b6f62acc6e933f145b339d5733d8316488006e2269e3f451ce08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..942aa0dd0d83cdcfb41d7bcc1385a52e0ec9d33f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d598fcac59bbe50f5b57f3c9b9002ac7a8783970c4df10382cb1c72455e1bf3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aed9f21ad9a0234c7d987ab17bde5ae0b6a6a18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2885906c0b9b95df85c81faaac0bba3864b6fc7e303d7f0006a02a6cf5d70433 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..761d3650b13c9a1137e860c4a208a0ac41de4742 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3655c35eb124a5af5e4fce4554866a5d287059724d5527e3d8578e4608928f71 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7b1341e9709e63ffa2dbcbd4db4a4867d11e5bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a09c3142bea12212741260c4726652271a8138e15b4cf043fde3cb4bbb50e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c58b7ccee2be9cb9ef9dc96c836bd74123f95f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25efc759a52f4c578a3737cffd09903da8d10a62faee9db92dff4a4198ffeae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85d2a0a9f567ac42eb804c2b7faf8b95fc7de86 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f131ffd7dd583fadb2bcc8d15e85aed4cd4273260b0d423b0d36b19305abad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9543c366d842591c80abf476c605690a13af91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79dded944c9d8e1b1dd4db26187b3350100377e5716f2d98b989d7a6d607c2ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c510123df2c782ca29b02d2d6ee3c1eb02780be8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a8945a1c73d024d4b1215f40d3008ff61a7b7bf35c9758ea9d5ed3b579b807 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..327a4597ecc8a3863b6b58d2fababa8a67df4195 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea978c1c9b191f4739e0158d9a8050c06f5ea26bf38e633c0142f8413472042e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2e7a20b9c874aaaf6269848ef58f4ea298b67e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327ec221dd2c9c18772d1779bf056b8911acf9aa68e92ce4ab2055ebbbe24e76 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ebf24c202511a8f6f1593c608706be0cacbc415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9aa8b1e026bae65736c52656cdf4a3cb1c27938ad0f5b2f57363b9f1faa100 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f45427ff6c7afd0dd6422a34b167f0055414a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dff700cba64a07863acbcebbaca7c3509f65ad659ab90e8a3df57cb39bf2933 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba6e1b40dc7d93bdec02bb29f291b4a87848ebb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd582aee6583886f89c5a6bd63aada0be91e80facee24a8c7e00f54346972efb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4441ddffb4922266be2ae28ca3df1108616a33c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d0659c0f4b1d89531467eb54df6a3f8322e7347577980289bca6ff6c9209b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd031465e654043b1abeb89feed25ef25ebe358 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f4486ec2a58a0ab6cb27dc858cab713117e3ae4b4af64571501f7b91c4473c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a68a3da3d1398d4dc4d016a528145c11b1f65eec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9aa951d195d98a8c4ea73b1f3d8aadb7e7d4dc9f54e4444df9ab47708cb7701 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b4a201158b0740af0e5450f9db72365f3c0cfd1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7a1dba52c0c6707e4762cc52f76148204be3731fe56a7b0815622f75196ea2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e712e838748bc8a799bcf885ffa25e3a6472eef6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e85959a3e64dc0d0192f77c8248127243322b88dc378c050d43e71025610bda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c21549cca9b6ac05398631aef9f82ae12e2805 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256b51d3345121570fffd59cb879089efb06adeccccbb5dd42c3716ec8263c7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8803190859e736c963217ac2f34cc4161a7c9ad0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e94e49f57e2dd7f4b227bbaaeebbfd2f28a297e97abafa05fce965c2e6cbf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55227e6b437c98aa7a2a2448b44b38aa557edcb4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5cdd3fd33315833ba9f2230344fbe6eb010220714516155050d7bd80a892df3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee8d0a95c407cb99a79b6bc3dda42b5cc5f60b63 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ca144f89b949c4f03d02a8c9059ea4e98e6fd5b8b7ecb9acb6d842b617f6ae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e781a4760b89b592890434cc98960ea8cf044d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887d71dc2bd0690da114b4b13033eb539a2b1fa5deb569eb6d61abd1ee640aae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c23f119e95971e268f6f8aa56becefcdfe355933 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa58213b85501d690f7c54717f3740c8dedb9849eb3d207925f08b5e31d28ea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6aa9692edfce3754b4edfdab624b9ecd4c7cad8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a97db39cdc12b31b97a97d09d79b49a96efa424eb172a82ada1e450f0d0ebd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ef79701fb50ce03d6cc9690101b110fd455ca30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c906fde428e9578bd3487a1eba1e4cc33c89808877f84d5aa7c28df062070de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40a2f0dff33e3dee10961b4741049e3b32f43578 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed5ce2a1f8545e624e08dcba95709c5d028da7700375a4c4cd8833c9397896db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..702fc3b238133be739a3522c19478963da4a9c32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f03f08a1e89dadc933cafb4f5033fdcbd7850be755fa4bbe06f761ad6e63d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27c4b18e77edceaba4465e884989b0d071438841 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e789d5b975f73180c067db4667c9974bfd5ccd3f1e3a680a8535a6e5376c92a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..737e52dbd31bf66f46e4558dbbec741cc93ce5bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49db0a6ff28fc0d7b31961300a361bb85b7ff870126015de1c5f97b3d2f92a84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f66f090ea21022966157073c67e8cb5b8d1fa627 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8746913f6cdab2edddd6bbfa3d8b882000d93c8a01c714fcfe3a481687977c90 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c7347da8dba6441ab8174046828642684fcc07a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f4a6e6a89240af91125e7fea43357953de0dc04d39f4ef6baf60214f825394 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5175583592eabe3eb29252bad01e654fae1976ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203b46a834a8e18f7ecb06d7967ff98be89070f84659df56d507dd45adb141f2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d1041a1c1566cad3df4e511bcaefdf31fded8c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2053d4ef082fa8d23e70cd313f02c389224b6fd151de287e56c6da00e696b934 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8646f429fc850f7c6e13e01fdc6f92d341fa005a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df45a92c58a1506dc5406b201d056559a96c92513f7da199ecce34385e42b22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41962b159da3185a0c4cdb2cd4428b75a8ff8f54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd850a050e04acceb5af5cd91eca5aba50b337a68b61c79fbb3cb7ed6348b566 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b0da870dafea911d924d1e579bb916ec568400 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e1ac09d5144b9aa3586e76f506f27ebd36b5066cf8609545270578cc9c649a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcb51a1b10b9480cacbb6a4224901f6dfa1d339 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d65801a6fed15c3bcdcd693215c526bc4bd2588ae236d8d145bc2bda84ef30d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a53dd18e3043cc1673707fe18b89a42fca1fbc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f61225fcd3fa1263679b4b7504c3cd9451f75dc37088337bc071737246f8ce2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8e32a83aad76aff367f24dbda322c8bdc29158 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88b65e2060a8adcb38946147f411c447013fd01a896f518a092556d3ff781605 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d632e53f9cdaeddc7793a36a9f858ca6e7826ab2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff39fc015222612abf1f615086134285ca213be274196db0a1c4b9d6a87b109f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3803ca309257aa07759b258f3c5eed45eece0a84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b88ed4c65f1bd699f555ca955c2aa3cff47ac41f5b46295d03100a649bd71bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..885b9e6cb2c35d3f0d2fd427fd1c8ea9eed2bf27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22eb8eeef94360afbc5b7f5501e5fcd9be3a7bf86ca761b314ab2ba70433ca08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ddce8e335b1ccaa987cf8cf19f965030f5c56f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f12c19b64edd8b6547014b6340c7416046811f9d9578d534da689745ff77f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a38d7ce2da2da03cca32092e82370f42942f2b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022bb5120e3aa34279aecf6c3278f3b17a3dc51a83fb357226a2fd9fe35eafa0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c751e6851f3ed4a072496be01d71e25bf2913ad1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa0a4066f38bd05fb8aae49544952ea9482177e28535069f916433d334977f8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3caa74720ded9c98c6109b45ee9a30cade0b2c8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c69c1b95cf4eb442be989846926243a86669ad61c8705bcafde685555edf58 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4229e9e26d28b4e8415681952e28d29822f0718f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d553f7d41160d87b8a960dbcf533bda1074f391a1f9030ff876fd2cd9b27fb6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..939842af37ca2485aa214ed90547fb06e9c505eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a283d04044ba7dfac1080fbd5f8514780f478c5ab6826842bee7a83c199dcbe5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b673e2d157ccb0621ad3a7a6d394d6a8e571142 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4cbd652d5c2fcebbf0a7ef38025db77d350af3a33a1b8f922f4022d162f560 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c307cdea3e3b4b6b6af360496533a29106a55bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f0c057c5d2a9b6f841d29eea913aa9518c50ae122d47d9e3148af4d0cdb9931 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5b360e27fd693c8d0ab2f728501890c853d7fa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc383418a22d8962fe98a1e194a5bd70a4c6ce6dd78fa74a9be5e04e64af6ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f0baf85a1e0bccc7b0470bad738a8fe9968f26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b191cbfc0e35768029ef2b91249f18a655e75892fbe5125f4e6eb7a55808850 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85de68211bdcd4388c1c8fc2af1d8615c65f21b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136780b32ecbf6bbc081523793fb5dc3abd874b8b2c6695316340c9e0e77aafb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dc12557c06d9ddd787c161674d647b1663992d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a99f3367dd1c1d61415816ac1017f8b9256b891143da1ca310022cd385851e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e977998b2fbff4212a81a786cdd2f45b1eb9ba1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:647fa4fb5ac8135e07ad0fe998e13efde390f37193d38a0eaeecc16dcb5b0feb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32ec4587e369adfab3a4576f4c949af41dee7a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3444f00d1f48b3380c730ab3eec927de162c84468847851ddf103f9cd98e46c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2af7ef734e27f9659d51843502a63578783232d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a91896ef77c6afbef8678d29928830f424e68e2fd9ba7d12d7f5609d24572f0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..077b2d049858add991b38b97b43abc28261cfa3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:085f6e9b7d3d00b1fcc1a8742502f605dfd409eec367f0f3465cce3a9b0bb995 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f147d55089470b47220f6acd1360f0ea4dc1e0b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7414c73fa45ab489c87c61151db5498c661024757cc650629b19fce75b53974 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6d5677e7b5caab3d9f62bfaedae56bb0b9668c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1e57994997faa29672b8ecdefd0a811136b93adbcb5af5c34c2658df352c37 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dcc7cb6e311adc63d476d35deae7115ad2ca9dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5343ead1f8ddf10a23d42f0b6847308a22865aca5dd55acb81b373664adc8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f04c650c75ba08146dccfd2dadabacfede8b8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5e612a886e3b6b813ad65681b86249c2396af6fa04f588f4e3677bb1caeb83 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f20e8e38b38c1065784e63c05bbd9b731d2361d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97cb1660b5c89618d2f090a573b5ea2f5dbb2449765ecd508ce15d96c041e24 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b221f166e40cbb4bede6680a5010f7147aaefc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f94e5fda776696a5c18855099d7ffa6410571629b238ca39620cdf4dfb39de6d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c057bf8e25104d47d85ece1f0fc972b765fb7d6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f1fa23be29849d6bf90b260032ec7f9468ec56a36e184e63b43dad5d12e41c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c991fc682d0f414022073f22ede50b20b121d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee472715b66f014fab190acbaaa1891cca75b78283903d85c02f5ed05b1e1e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..616c701605fc4948b5d75caa4a603aaaa3faf6b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdd45f3dfdada347c480cc739119b813a575c8b36abb3f1e6b858b9893f416b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6365a46d8241a2ff7c5d406e8447a263ea06a2f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:393e9ecf32c1b60bc1d09c9bc32c901b62575f81d9b4824eb141057ebfa1a787 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6720fe634d0ac84d8ea7ad0fa443a67ea21b88db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bc873e00251e95d2545cfff8e900339b72c770a395c259880985aa71530e5b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c553017018df510de7cfef25e39090208ff96f95 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:580f1ddd0a837c0dcb2960aeba6b385a46b8424ac0e79fd70119b7a8638a33b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cb5affc8b2d935ae0efed90ecd2182f6d3c69f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c301f44873d8846fb86e2f7367672140edc487c7be677c5fc8f3d75c7c7c70 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3511bae739a5958ef0e929c60c726b42181c6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2860ea85da4917a661c6d4b169633bbbe45477d379eb5acabfa0dd60bde59b53 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b20a15d9e80b4798e36cda00ba1e1565bb59723 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f402c39cc44cabc236590d8776b5d8f7381bf702b2dbb12564158da2ceac0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa59ee61c36719e71966ebfdaad1a2a023f7079e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb1706d38b4d618a39ae12c922e547dc031e9f3d8f15d36327d71033a3a9b1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f68760fb965456bef76fb70546ade770a361f866 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78aa4acf4ecbeecfcb7da295ff7fe504a2a7a30ca718ce2ab9e426c9fde1282c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..985e9b3604099c286c46d3b2833b25b3acbe7374 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec06bbadeb3d89bded1832762a88aafc48f270b3d94a351f5e6ec81b73243395 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..353f53fd875a80f7a6053cfaf602ef93b13163f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94a1abe169de2071a15e76924f694bfeab3212679948603daea4d9ceff9f943 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a02475d3387cbe91adee669e6787b0dad07936 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d9bf7d1c7f53276906f697bf957c1a02c278976cc29415b64b5864f81985f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..577e75ffd55f8367064f753c739d36b7f0299152 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a20c3eb334d54f86621ea522b7d661f1abfa40caaac70108d357e44acd90fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47abae8e1e9352c74e1edb57aee925610000442e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a531bd7b5ba2d6fe352e655fbda444a5149b253b0d1ed4feeef037c7403ec01 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..318b6bbdc6e4a5cfb1adfa4f2e922aded0e73b8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb1f24277b55f3f4d409a5853da83b3faaa1de5bdd65ac2dda02cb9b8f8705b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac95d5a103e53dc9ecb131777bfb1b64c82372c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4a2a9a435a69372f518b539467e3048131a56fdda3d016f0c8960dd6994d2e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ae130605ec29cf6e7d0a043e2fd09d35a8c7db8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201a02a64f0587420735d7be9dee15f4158fab5f90e9bb42e219943201de1f60 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef206da30e5756946276f69fae451506530799d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b99e36121740a7687cf1ab7f66315daa308b3fbb798d0620dc52442156192d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96039b9b5c2096a3ef147d7628bf2ed606e4d1df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f4d51209842c29207ee1a7806c4e80c213a38258768246aa6cfed41cd652be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1903205717882dba05ba1010b5fe3a176cfe2dbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea6b0cc2fa37373f2a9b94b3daa0f6ad947780d35615ea82fe23bf2be9f7c91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49998b97f98bcc349a76ae0c74c5c3cea806e709 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55aa3911f054b9be55ef120710650b3811f17ecf8badc7e7fc329849145537da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d3359b34c7d630f6ed70c1525a91b313df3864 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7158d45f7a8be505c0856c8d84e25489da2004f26134716cd96e17d3599f487 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf34d13a57e2b41d38b337adb0b4f645cbf7711 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8b5335489a797ac648542607bc7d8147bc0efffcf4f4db69fbbf39cf71878f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b54862c7d152396c001758bae244b85a89674ea7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b66b90571ae22ff96505b9dac3871c3f0fafbf3ee0650cb0f9b7cde1e333a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da990cf776c7c0a91e07d83eb9a8c68c173d023 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25259f39512eb16df9c41274635c170b62acec38c3b89ce1bcf0ad81cf6fdd1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8944cf5c29b433571c0acefa495ca6e62b8834c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c275e0fd85a66e80536edd43e863d795499e60a66586e7ff50d6f25bdfda60e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b7908497ff289bf48aa05bc12cc823496d1092 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f04de404d994c78232302094e704a3e498429e4d8922b12f13f530c997e127 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6514fcc21d696443e84950f1fdd46d023735a09c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a838e90389a76fcf65056070ff9417077d3a64f6e0534a37a9dc5c8b0a7918 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b20a19c9b31b758f0a12a6836ac6e1db968bac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3033edc072231d752957f99b42d0b72b1d9e7c8a2cea6cc3b822012656b5c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93de88755541c725b3351dbbb34f989f263f31c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab2877d58321e6e99799a0e75deb3538793d0c1d71a72763a31cbd08ebe965e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04872a25e9be1d2481170be8d48e90c8a3912149 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614725a77645d017c17d7807dc7d6be74d561671c3ea0b7a1b3ba195a9feb857 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6362ee06ea376c548da3d8d79a2cbd14eca6f2da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7fbe396da35281b6594ca6032884c43ae74457c5d8154e28c30a152b9a48a0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c59cd8302962d1ab37c1080ad11bea08113922 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a908285b30bfeb6b5f3cb72113c050c66abfa260f7eb6710246ff6c5551a9cf5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e89f8f3d690df97bf0736bc6cf5db13a92787306 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1369e71c41f0f96a922ba14a72227a4227135333dc558d08a7b3dcab7cc5ece +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbc66e25e133333abf7866ec98b652b1bfd3a2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0124a2c88c8551af3d42b431ad483010f426d55093ae3927b3ba941d29f5ca8e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae42ca11e19e5adb92292c26956bfc1b2e161f19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20454246b5acab49278d05bf3526a011a278a0427472b81ec430a8df349ae70b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a6e12d517e8a2c65d68cb7cbe546dceacbdb2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84133e87c231fd98e12f882ff81d1202e38e18996a908f7faeaa9624fa44c06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c888e0281e625927ac8d53400c138e9e39a730 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c69f1b1fbdbb644c948c98a9cbb935d1cf31d84f0316d01fe0d318a07eadd27 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8390bfcd2e780875936b142f7d08a7603482380 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ee9e06b8c09f4dd9ccb1c1367d09e81b7e630c42ce2d055e46a1fb3a6434c2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d49435e5526cc43820306d36adfadd75e85b0f92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81f68ca8a434178174b8d5b2f97d102d99ad1abd72baa985c8430fed269eccb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03ff8c8d773b7413a03d7c58486800db33ed025 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b19a2efd5e58e85543108b69115f7f3c7d7cc8ad3bcd9b0089a17f185ba99b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8780c8b87006d5e05cc6d49c7ad41a9604d85b1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3189c7ece43eb62b807511ff82d7e185f32515c30d3376bece27c22ae8bfad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c91c3d514d287ab6ca9c17b2f33c14b28c3c5be3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0381a0659ec4529133b44a5b58b8f3e7baa7dde93c7d902f0db967aec963f524 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b83d1be1106cc6cc3ed2b632de6b380e4aac6e77 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f26d518a4bdd2a9d1de633bad7e89f06c7e75dc0d7eb109ae5f51510ed0641d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86040aa58b4ef0844aaadcba6ecd1c460706db6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63943c18af094fef5b9ddae9590499b4cc292e0b01d7e59db9beec3867d600ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d97a07beb096a3412350532ac2d4c768ee587ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3906d599e58000a05d02f0827bfee7fd04bf1ad6c8247dde286d122604c804c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74adadeeeea19f1fb228f73db13c187e95748039 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d9df59e473bd8cf45ee5ddc3842b7dc6ded2e4a628812fb5d37351b7be49a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d117cc9abdbdfe459073051b2f8209a51b2adad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da06e86764e5f4cf26bbe61e1a078134aec20dd3f4a2c0232f09abf916d7260b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cb3b5e5528bca5d7e5732ae879314782ab60a3b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2cbda3de41c248bfdf301d8a68fa993793af522fdda8ff452c7ccc750292aa5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c9ce6cd0b8084ac8d98215c19c0148ce4bf3b01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae77088d9880d867551e44c5d25f82bdb73122f9ee556fee15d5f0446129167 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd1f49eb98ddc8eccf2ccb8aab5ac9449d401a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eedec7e482068d31bda0de5a9be2114e8896e2da2e1a88e6e9eb1d80628861e7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f48557e1223d22194f80abd288cc2aa503abc6af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94fcc4d245511878e32ad8020a65dcbc77db1aa9ab3a9e7beac0cf00c9b32c20 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7390bde4fcf03df5fb8882dde8cd33213af1dd52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d36729d9c2024d420b25384573215aafcd44e3b339bdafb2f22f0f5335b801 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c7cf35f5f72342cbc125c5dca7fb6a506b79779 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b565e6fbacc8dcd1eb7e0d98ddd051d8fb1db842f41862387737980f9ecc7d20 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6afbd210e62728045c60800dd14b241913205b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2eeb7c2abce7e65515cac3089572324289823022f5f4368ef7f85df355a067 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..155fe6022255b090111807712ef191bb4b4b93fd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e43fe9c47803eceaae589056abc125ef2536f40b8fc5a1b9f6f00a3509f6bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f45fadbdf1fd618afb33e5507d03093cf771dad6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a264ff1577e354bae139f0d25c12dcd589a893c01cc604126e660e553a89ee04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d921063b86c9a63abb821e15023dbc73bb7f16d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4439dbf3c0356cf42dee8de08a52b0d9e61267cfd3757e2ae0a17c48cbfa367 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..984312bbdd8d50991bb4e25bc8b9d898ad18c4a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c884894071493c46a45bd1f78a67595cc38e6ce7212cb040079382c92222bd35 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9b8ae81a8493413076822a68fcbe6258d036dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956a9717a7ee7fce6995ca0771cca1075978a9bb6e5493ae1594daee5e1c9102 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..874987b4e806c7e29243a1b583fca1627b273ca3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877d137fc997c88da8f31db5d311ecbe1a9ee840f04576fd949d2e906b2ff139 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e3ed814e943d1f07f662e1a00df1981bd4417d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18984a3ba9f71c2a366ba352fddf8b9b6eee4b21829d74801a84fad7c5230d3c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1348050abc2a45286e1620c613660b7a73053188 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2acd186fd3ff972c91d76930020a4d55558dcc76f20c2606afa29b63a677c0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a695891a93a0043029ec6d675a9aaa80c1a5cbf7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7588372467accdb2709c194a321c02063efd1063bd2cb67cf503ac6847202b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdbcf7e51cba9977186ebc88b7fc61b8116e9540 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751b89433b786fafb568984c90f16abd633bf0ce6d0bb97e34f1ea121cfcc570 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42203edc70ae8caa91e6aabe455f6fcd9049fc87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e0fac88daf502d223764ac94557723f9b56d3717c3988b75f6ee305e6b9e29f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..418fd73f2e375d78ca0880fb3a1c10d8dc716fcb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e72f47e31dc829757e3577450559c52da527127bd89086e9a00bce36c22a3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..101aa8a6c4579a80bf021bf74901a66097c55bb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae6568f67e55b69787f56a413657b801884e730cee4111a8a1176018d7d2e3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b29906ac02e58ed0de984755e95d5d59b0f6940 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ccad490bc58fa85fcc14a006883f21d934574daa988dc3a9538b5fe96e993a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2c917b76b893b6e8d4ee64437923736e25c5602 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f8a54f623d864462d50d9c106ac9a88353956ecbe663da9658b83629b4814f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c16bdc4b31f09f5ab6413649f1ef71cededd2ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254c7b8d7430e15707c0895d5f59f29738a06a5fa70281390b8ed2899be64ef9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d225ed33db7d8efe76c1a32cc76ccc91cf114163 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4180d9950023a181a3aeb6894a96bb59654d2c773dcfffba840f62031b0c4aa0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f79b7d9c95373f07d3596a1da3d3cf4abb412b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9941754a07c59b5e846b070a0a3349821b5e37c0645e5e4d011caf0d052c4375 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8868b75f39813afa8581cf9ec594cef062d9ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2d78716741f02295b07b4d3b8c327952996685c985216d14581b7d14a47bfa +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b13cd3a9db3f15b2bc24845c96a9c5ea7fc596 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca53c3cb089fc3aa08a2b8a3ede7732850e3fe65cab84c04c97d5f65467f173 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8be9a7d1872cb016f8281ab8668a15b5aacb2a4c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bdf7d6aba44750d81e1ddc3dc2f6c4a6eebc2225ac44fde65551c8b3f595662 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4965af7f17116f397db599f4534e4c4a0e1c049b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fe5e9ad9225473fede0ce49a4c889df56c7bb100ec4f8e3191164ae3ab6c4a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de94be02549a3cd358196fd0e051bea9abcea53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f85e8d2944d60b73fa89db4de5b706bd5e807dc1a7e7822d4565ec614e1f68 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e530db57a2e249824dc1294d0cc6e287205aebf3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ef074d72326c1907ed3626076c2ec319a22389f34ccd0bd40ab738a812d2d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5c5d76ce6b231975ce6a442db4595741c041b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a773aef950c30421d64f42409f7d359593c0439dfd5fe9c662186e1fd39876 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f14b5b089c5ce8545b498c94603cbb9eeaaf7476 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bafef3d3bd122f65a05b24caa5d0f51bb641ce5f86a4f5773172ca16f6298508 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb487ecdd89a9e9ed87783606ed30ba6653741a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:846c501eb09cc80fb6f943225281f86aafee480df7e3710cae1b645230dba73b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a4526a487a116a677d1adaa6e875bb34b306821 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2b7a141a92c203227393cdc720fa293c12daa911e28fc9797b0d93566a0dc8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e02528143bf5c7055ec67a99a2fd1bb4914065 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4736f0fd1c9a31122150fc47c4224c3d71d8b00152ade3efa9d6043393d568 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e930158f8ea3018cd823fc6f05f9ad276b7f433 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9cbe1c413c4a839370ba7b210dda7fa6ef57366ba2395857508cadd858b1d7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b26297ea77a06e8cd5bfbd499a750eb6fbef5dc5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a4f253f39b99bd8316f14a44f1f04483b6226cc70e5ecb6d600675e980abf7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8b99c28284c31acf382a119df2edd0d0e546961 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbafb0c89811fc7570904c6facdc3ccb1160882588a31f17965640e93a0afe31 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c788fdff37a344eb08cddf15086541f1b6eb9f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad9dc878aa9a0f8fac2a6524382f86ecacd85870fc6dc0b48a44f3cb7cd2dcb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a628471746a19f81bc43e9e1c36d392c2dcb166 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c97ecaa508c052eb252ee0f5547865fe29e0dd4871e6439e789ee4b7a459ba7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8053801a79f91b0293cc0b574a181cd1843c8b14 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2cc1c168aee96db0d055f861017f3acbfcaf400d81db2a171732fff730fcf7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f88b93a73a8a4fbdda1371da53acf9e6a34019a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64303f91d344d28597c72dd27add4c54c300b88b4f37fe93827de6df891421e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca5b3c636bc7da28bda8d52537afb1e56ee0e28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:064ba34df63d2926b1bf7e852682ce532927e3b98483b5d92e8d13763a5c4c57 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17374fbe0f75412535d87a8222a6d9ece235a830 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b320487dbef5aeb33ae3f4e4c10f1cc07f88b0dd569f211a533adb818a9522 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94d9531cb45bfe3968efcc9d6efdc3fe99726dcb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b69d026913d1ae7176d05b503a5980dcdee0719ff6dea53ca754803b3a4a06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..932315d6769e356690fbbf0b1894c8c29f945f85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31da851029e08e8a9cb72b8fa0879595bb73eb068973ec99f651f112e0931631 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ddab707229bea931e3c5afab1cda02b82c50113 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fceb7fc2b8f622fe0b4bee2ed066270e99ac4b45832b77df402b6fa79fee558 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9db5de62e3efdd8e9f4d9239568c97641a0509 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76c73bbc19730fbd3c4ad874357dbbb989a4e10f8a2428e4a316a3c206fa5c4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec5020ef1f0d7c50df22d2579cad289ba0a0f53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93d42a02fbed649f81655a9b1c0a5dd152dcb3a38be599ca6b06d35571ec892 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..390330e9fd3fc34c7e02594e5d52f56c18f711b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623ac9f59bbaa720ca762d657c77863ee9b1f8acc4de0cf30c02230877e9e83c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ea550060178d5c3c1be5c08822f3dae0d8e3b4e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde143a25ddb016b10b9b1d672a2d33015c0e04fbbc7ae6c41b7ffb16da8e09c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec8a99afa912cd3d0c933206157af735f333bd6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ed443e378d6d8dca1142a201dd2532c281d25a863b441aebd8bebeb3d37083 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e80e47f6b2728c3b63f424bed7a617f377b89d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e39e09925727550471a4038bc0f66512500616dd5a351ff2696dd995a6c5f06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ea57d044487d6b450c552b9463deb2e1eeaa3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8743ad34a889e608f62b7511634065e51df788e91a1e9619b462303bd593a70d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b4e2bff734f6aca3bb1ac95e62962c93721747 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c203900925b4c6445c32b3e07a120a98d47a30b44ae164ebad9e71e78b0669 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e17f8afb0a0ebfc50f5fe92f849e48444016613 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4012ee7cc6f3b9d38943285f38d2aa6e86d98eb2f6605aecfce76c4180324669 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..162c103ceb2813ed5e72d010840dce5d88972cac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9108062a158d70d39f50e5345bcaa6462bd24bc715f3f63b32e64fe9235b154c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1b7e1a638eab788b3997850af008532870511a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88d600394aa044c016dd7ff0887bb0d441ece20eded879e433355f9b79e5660 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a95b140954ea582df670e3bd489cbff49dbed0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897e3ac3ca627e7720a28db358160d042fe45ae6fc46ea40e98cc5099d35a0e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9829331ef84f5d80b123c23ee6ca732795555a1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf1494d20991b7e1b3b7a274007081058a54f5f1104337c5d074e321fa0dbd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9bca53b6b951d428cb9217fc79ee730a54f180 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731179ae1c358b1679bd1f6d1bbefa022887b3ec9d3a89486e2a14678952f7a5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7382b0a8d36fb87ae376c3caa07669cf233845 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c58433db929f20e3cffd2bf1006ebc59d63afad3bf702e28ef99176e443d248 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a5a11b10481c302d9574285947536bd74e518e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191f3149458aa068d2b97c658e098da808eb6bd7a7b0f38c347eabdf433e7f98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6f2ee7532bfadd1a6c6d12eee57e0e76e20b46b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc89ff6bdc988cc03cb3ec8c1537a7d030ed6aef6d80c05b59c9d59844ba3f76 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a389c601f90d3d39bbc28890a21653d117c2981 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785cab9369b5d39df6d9d45be5c2bb1a6aab757ead0e8efb89d4a1b5dc1705cd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af92317c19e09705a823dbd91232c4374c8bbb16 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a2ed431f1512033e3ee4dcea00c66e2e1141f6ee8acd99df73d34e7d3a2885 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de8e6fcc9a317131cf3020c9e8e01b32a018b056 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffbf78447ef3802c5768061a064bcefe971b1c24c2f053f0849a5f31d7522b0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..beafe25029b48e252bec6bcd4350223da874caaa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56362de41058c1978c14a95e8725dad0fc9fcda468b3291b6ca12d14b48d57c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df45ace765497df3a05e62e979fc05ad44ebc57a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c98e8b2b47d456b712a1dd4603f3e6f637cb02e4345d4c545b31abf708bac0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02ce1310406da72feb2e0900bfbd8ff1b47ffc9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b295025bef6e5789e66e02b0c80562633999855917d565fa029b1903c811afa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70ebfaea15546d3d9cc7531b7033730ea4ccc5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a27e2afbd0dc9840d0003b3193afd166da5858a0838555d7f4ae09701304ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3e18973d34d9d6a119f876a7b642e6ea4468323 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64d16c77285453be056b1223dded88b38b2ca4790739e9f97d2f7204f746d47 +size 11395