diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74adf017a2800b7210e9725183cc3ef852272568 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d7e63717180534c58f1df9b06381cfd3ca80b9dfb68e61b777f2496c1711dd +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e21dd44ccb75618c5aecbaf8a0fe3e5b2efdd114 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a0066f0ac3b9f53d5ca3a5d410c9c313cc9b99bd189385b6517994d15597cfa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21aaff3094b6acef7e23d75a7487451b3f7713a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811f616b83a030601ef6c897941c12b991d4970a5b9964a6befd5e44a8ba3203 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ac950aa8e62bc8d628f91ad966f174a42327c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4f4238ba4fa01e22963f4e99a81d245dc99975ce01120e05238721ee29aa0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f7763d23c4b63c59c1e92bfaa1f70a53bcf1b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a056ce7a4057b204f46eec7578f88c7a498e42928bf78e3778a324f237dc6e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f974f011712327526a54acf20dca1310ad26721a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5510f9e6a5677fc3e3dbe161edcb7ee668e64d289ae1dd524c45287d0c53e531 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0747b9bfd67e743575aae322e44f8c48a0b4b1af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1f0eaf1088c269df861f427722d35a799d190c836eb9c670c114b0f08edb12 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d502570993609c18895e03c08f2d3b24c5edde0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23070b0d0b8b02db19317489e21df32a02ee497b1e224b06f2b11e42a00e44d6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1208a38bfcf6cbf8b0d6d5f52ec6ecb154dce0a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e220ba6a1c42784291442ce032e5c6822eff7227a058d91f7c100eec2594374b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5ecaa0c9236897e6551d69856d5ac5e2a4944a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf022de901598164301274865e0373e1f65350c3552ec08e20647183d894d70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0282efd473a2b01044edddd751f4d83986f8fc38 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47934c05b7e58b7ccd278ef0fb06f4094a3c8cd86911c2322b5f57e494a6cd4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d1efc7c365a5ae58c4314d13283b27bc2579ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56fa8317a7c9196205fe45918f7a8b5a8c01d32f4e828d1a9dfe624eb5aef81 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dbd79fd762de48d5f9151dbd7f0be7e508c669d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8bd91f3e3da727bb4a1e83a3ac61713253245f98c6f2c1b9b667d6aa6983f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46a65f08c5d08970eaef1fc3a7aea0b5194ef87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0eca24cb0e0f4cb408ba4aed3e9a69e141a4f9f12a5520e751b5edb0278d80f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..001f672c2230374120602c460e1717c35b7c1228 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ff3778de4ee3d7c5edbb639be7686fd1ef104d9bd8191a3d378abfa571a1e4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61487c6ee9038add347cbe635aefd4ad8356a677 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f542a58c128745ab6b230ea8a2cb0a1b04f2553fef5513e386b3250fbc9e6f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..371eb927f33dc8809ce402b22832532618e59b06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76565d316ff44f1c2c36752e1f8b7af0eb1c39ed557fa5afa0ec33fafd9583d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d7d7fb95fc7a7168440f6f5c65d263f5130d21c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6390ce0b9a142b291eeb4a4718eafcc80cd37ba9caff4577eadc480b0e4c916 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a57fad049e0949727cffb8bf3b334503b9bd438 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5633316c7006f68e3ba369e2bd08717f55a7e0a14970ee8b74297a4ed8454ca2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e0b61e0e42e777b9ca0b819ae262164eca1fa9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d883e65b80cd900647773fe80c12ec3254491767fd2497a7c17052e698e3ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b921135b94b3f196901cb97408e94fe999df6899 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276955c1a76d405a5844ba352b60a3a8ad591490df4bb1fccdd339d9ccb3ea9a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c203ad28ade8825f36d362a867e13dd7bf6e1898 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0631ddbc8975bd307a295b9a96c1a09a71c1e76c66cef055839ff396cc013d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfb0dfc7bda6cf8fb8e65517802574659086b024 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c5acea14c1c2979fbc5d69688a7bb55b7dcb0fe1bfbe97ce5a02e7aa75159e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f9afeb66ed4d38f54086c8b440b13a7077c820 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1aa037144ee28b062c5c33e684403d7c5d7cbeef26956dabecc2740dd45916 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17f11e98adbffa4315e551d67ab6a1c5c21fffbe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7db024be318696d08e6e56e0a1b6bd3e126b0c69d3b621b12317b45307cec9d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68a99e3c1921ef60b06354055bfeba6e0f8a0f51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3227b5ed040f6ae9beccfeb7c732d40a5c09e06a35ef64bd048b099b4af0d4e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d449c73bb97958e7ea38b775757a371d5976c4f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1196d00b93a7f33666d98a04894303df8f967d5c0d8567f5211756067915d259 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8192cdf5047a8e57a0525205ed3144df1181fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93edcd55ec26752967d6fcf5d45bc1f12414077157d62858593b7c298867886 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..046ba04671023b8839097e89a18a8bed5562f20d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3092c5fbad9a991c7133b78adef9bfe1d338e133607d5d2fb79ef48310ff913f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edebb9e03cfd341ac60ca99337de3aa941eb7bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0e78c3da627dfd31ada09ca0cc1a3af6f58be093c5f5d12820165f2fc795f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ff1ef20fe792c0d8de186b49528220020bdd88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c461b41bf4cd742a456f5d64881050853c45a224637cd0b9cca8d8b20e6f4dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faaf18e58efa347392c5917e595e25362351c683 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39fde215b50dca5dfacdb7cd455018bb735ceaf068efc45537073a752e7fddee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77d1fec58b1158399f549774405d55e527005ffe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9adf1a5923dc99c8a5d10d63eb392944fdcd255dd481e5a1066b635506d54024 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c932064ddcddff37d5f2f1fef4eab6dc187b50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2540087e422dc648d6a28c517ec81fb37b635b26f507a3dbe22767ba58f9a67c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37c2662d8310ba61dd86782fa518eae21b6b8a28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c4fc295aae5f82dddf033c88776926ec78215c538dd0c377227efd1cfae7bb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..000f046cf693733b67439096cff1a8957cdebca4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4cb02694948d2f7b32d4b071f1857384b5745cccbf77c75cf21c1d2fb254335 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07219ca459d023d3daaa25ccd10a55a54baf3903 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07dc01e5c516438af3bd6f50cc2df7bee59fa858ac79ccd71d6d82d74bef53ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb64eb5811f9e1f57a1ff0356c9d5eb86d8f6c58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e887272560668019e91dab39faa9851e51721a6d0de01fda5d6a10968812270d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec57e88f841f88b81b11c71796560c03b139a761 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fe372ba259ed8e61c86923b4715fdc4d6a546f8c094f9e226bd4a49682c0e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c9721f79f5a710153a5f44e80111b1ce554c64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec2606c60be9f8ba23c8d46c8acfddabb9ceb9d9fcb9243c85ab55530a70301 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4b02319cf78602f3ca44e9f8bbae4a2fa82e55f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86593ea49e739f24867bb6c5bc7a5937d242b1be8badb5657d648d759e8c0e0b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2983f07b292d059eb749a9e7d37b26fe01b805c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d777217afe15cda1e37b2b5dda45e537beffe6f0913163137b500fbfe291b4a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c8a36d6d4c066e749ac38317e08fd503106bb29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05eb3d20cb320ca07880dd59872d11576d3ed72743978d1081df9747f7f98062 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0727f89a0b3791c761541d917aea6a2d2807b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c4ee7933e6870c32bad6e6c92483d1e341fc61772b24144e831fbd4b7ea8ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5705e499423124de45b8ee7be23bc8e6daba0f1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5b1438ee3c563f38a15a97ea43935e369783833398811e2ccf7c29c8835178 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59327b218541c43a90166b00ab1de5567d5e492b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1132e77a836ef97f130517af81800a7f41b193dba25f8439dd80239d5e252f28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e392bde31494b17d6697bba2209deff7a115cf6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26bfa8082d0dc089674761bafac63fa2ab5cc9cfe955a057c1fc1630685ce066 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed179613ca5554498b91e0c2da92df379b0f213 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc7dc9d122ce86f373aad441b8b058e3a0c4cde42e4ddfea0f6f2c7fd55f13c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b525c2be7bc8d63f17c4379c610898bd51d0a2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df33105c34b08006e5b30550f9fc0eb81c99d39450956cb962b9eac96e319548 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a22844a6bef8924db3b67cae6a46ce4c2a738da2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae3c7e38283a5f5e54db45cf32522bd9afb99772da796b2241d44c442f978f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab6f959f0627e58bd8909f38a71d58d486ea59a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8535f34ec87adad6ac8e85e74e94ac97e747f544723a8eb6eca8ea374b8061 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6cafc3649b997de10858d764debd0790e301cdb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba9c320a8d194c949d65e975068acfbe60970872605dccb84a8dd726f441952 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5f9329d615d263030cef489b574a65c5f5dd13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0663ef90faa04ef03f4d61adb4eae5687fdf2b5205d5fe48986c0a5d12bdd26 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d97339f88242be5470b6fdc2ad4509bef589672 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973646cbf813ee0f9cf9593d293e3a5a2a67f2db52126b24ead50db04a99eef0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fbafcb33034737be4df229a726fa55b7810e345 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba369981cc6d31cb88d7861f93d32467444b52ef12f4de4a5a7644cfb0ad2bac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5773b5d915d3e8f5597571bdec81b00705bfc39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e13c8bfb02d64706f8503111d2b2d0a28ea8c5254185933beec133ba72ecb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ab38fe575ca816ff60562e817e57ab78d129c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981004e4282def29281b14ebfd09b5d56082f0516b3dc4a46fa0ced0b4fc4fb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62398583074baebfcb859459873618f950ac6b83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078447c0d9518dd1c48ad841ff7f15499f059678ba33469b9885361360c8b693 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd9bad7d2d106cdd39f9b33c74f94bc823c3277 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b5742f72c78a0f5fd8fdc02a8229beea8ab46a60937b50298ba18f19c6b30d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1dd06d72cd74e7b776174ccc973c55058e658bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3172c64f8f8ec4c829a4840a3234ebdf510e38b1e36901ad3fad2fa1703cd644 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0d92f3c662fbd69235660b39db7a9c57af6e28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0388886204bfbe2fbb5b20f1f89ec9567b36f3e1c6334b763715a4661d21b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be07c73f8e3e9e24dcd4331012aabe2269289ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1380364efbec989d038d6bacb110508328e99b0d01e1381afb9c2809a9c879 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae656c69763d46d2bd50bc8799fa479203a7379c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c148c1178f15ad613859a25f419455507f43053ae86c8eab3aadb73d7a0b0ad7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1a498fdf4fe77b652e6a5e57a9e15d8edbfec65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becd0a6e2f5469a6c9368295fde9f487e1f5dd7e6bb15ee531b144689c70b17d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b5c7ec3f66c953a20ab27fae77f4334c332936 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dbbfdcaed7bb43bfa5c495dc588536e4e3f2ecac8de85c7719b5b58101541bc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f55f839d62e799cf51d719bc8db85cdb1c99e6c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1b49d98233626d4e723c9e79250694bdf0f20a424e63a43d9925b94a9d065f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b18edd74011660ed255d18e0fb76cd456bf076e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a33870e79ff64b807c82ac3ae71ec877396acaf9b0c013092ea104bcd51316a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5f6989bba0bbbf4176337c63304fac6a8be0c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb98ef26c5a3e2d88925d07d51a99cae71b88d8a1a48689bb997785fc86c365 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..285abab4bcf5fcb31367acb9f8ee81ade4c14c48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82ee1241ce9e161a71607c8ab54ddb029686122356538cd18f1a025e490c484 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab6264df9ba73d026f0c0ff4605c0c169a853c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dbd666f743441a906c6e3d0316c92eec9bc70ade89a8d6f3f35c57df6b899ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9122600b13c6969f1c0aa9722fd1d2d5894689d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12bd6e2989b1a0e9498ac188646b5fc6d914b290347cf9d94f0e68db65d89712 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d803623f7f08eca4fd2769f88a297a3a6df9abbd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0637cbe85f8d4e7591c813758a80749c2406f3a2ee0739453ee207653a9ae1dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c9ed5fb49c35b78553a93c54972db0857800054 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ed42d0e1a00def34f3136b9d567c974416c44a4ab2986659decf451e381f37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5374ed28f86aea4223e80cdb289de4ad0cf4be80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f9af532ec57ab77c81b1c7c22de1be04f940c348e62acf04e259687f3cf9a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a6830681006ddd414ee0209fd28c04e7235969b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae821ab77aeda822529133094430b22545f077b153c8e9f9149aa05d28350519 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f103583a1081bf6f18e7172c215502f1ac7add1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0fc22d20e77acb6b967057dd7eda6b3c95e52bac12468d3cdd566438e9dc79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f9354f5e7cea53f531d5b60709813147933eccc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fff6b072c37437ebe4de4f569386479bc46793d3964ac1e7b05c57328dfbbd4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab3a8fe2762e0ea6fdd02acaea771080f9f877b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c19dcfbbccd146aa1213b9d2bd4d937439b2dd8e36a52b3cfc0800111e8d0b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25216e06e2d5f4c758dfc4600e06b6fb9cbc0878 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79d1ee19419b7f61dceb1213f644f2edede25fecea02e1b789061336ae21e1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cfaacd8fffce9a5d9c9a6aaa084abe1dddd704d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0455c3d0af6e4563b2a01983e836257157680fd7df119b8f735a9e149f397ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e26066cf2d14f079bbea49fedef68d155ea8cf7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36cc9e80ab1f234357927bc2d837910057a914306e57ffcea70fc7bdd8463f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..599a83dce84a9ec862e0d9a366a68c59e5c58ff5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a805e371ded3e1707ab2ebfb981c411dfa9f5ed6a4e5c3e3aa9272fdd00a1835 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6676ec9f07b9a6010bef5ecd1007a94856a8c335 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b02cb2cf882b0e8808ffcf9249f926e1c23c7fece97e296cf015c58c508e039 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c57b507afcf3c61d44e5b0c51057ec7a8a9df4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1970f577316b5888540b97d45b7d92a7ecb2b0c4f908fba63ef5a7b5d3131c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de55c8b2b03cf8d0efa1b38a46154d2e19d44c6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b9c6271fdec1daeb6aaa353b6bba78d9d17ae1487c31136fabc41b83484d708 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b4f8f786f44856d458b636603ae9849cb1eda7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ddc5f3cef32b1156ccda6de3fba29365dd5f30657de26b7c7008831595b460 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b487d436752409084a588324322c432d7a3e2f16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7337e6429e33f024b0f246c5b18bb485b39560e65382746b9bc007b8ebba101 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7be5815116b1a4bbf60a1bd651454a3957fcc91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e46766430d80a790314d60e611d4a04fdad393450824c94f429d7ce0ebcaf3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df01409b22f0c3aeba3a094294bf4c4f88fbccf8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5930c070c0239a2dbe821e81607458a56289808463a3f6c7d313c51cf8a2db3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aab0265b7aa0d31716c53b7049fb1ce26fe4b589 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5fbed8417300ee3f8cd45cc1cd4ee4188842e89c9b4434a64e9da4507836ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1057a6710b3e4e5f31280352ff155d9688387384 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbd7e002ca26c5d42e1b9799f44b2bca0790db9991f60e85d03c150647fe083 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5efe234ff9d9abcd5b6d1e5df0c07826718707f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0da864de08ae2e019c07bc5a778c28fc6153a536b2eda9e91ae87022965f9a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..075954952497a7cc71123b12b7507761f3bace7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74691b31e095f06932db72e73e067e5cac720289d12f4928f4660d43db4639eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96c4f5fcf2b385f76e6e620164442930438bac9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:208c84cdf77f16d74bddcdcf4522e5a809c480d03ff0f2920168175194e2414a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..271caeb5f039ae6fcdc23bab7ba67b1e284d7a61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2bec180789b62132b0df52658093e07d30c643c47ab5c6e00ffb6f309c003f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee219425a90671de255d00e48d0abb3db6c53038 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f71f7206fbaad45104aadd3b0b943cb1598e2a52fa163b3750b152e40cbd2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7829d0c4efe2c7eaf337b98a7ce31cad5b4e2ecc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b8a8c62fd280eb82a8949f52694ae41f6d71ee2c45fe2c3a74c44ab05e6b88 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6085d3de101cec388b073bcfd5158a9ae1bfa21e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3e1bcb05fa91d93b9a58fe68082d73c7d18caf7fd1fbbcc0001bbc64ed2907 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecf2a4e3ee4fb81990eaea7841b416b270885eb2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b965904aab6ccf1e79d5c06ecd81be111e6009b7fd670a6fb0056949c03e63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7dc3a84dca27aae5ff1cb8320a4661b674588a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf40b63ab6f216f2a0c7cbbd402b52c40e3078db39b5c82be81b0727ed6d773e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c258612cd0022159ce0ba2af968fefe341c2ddf0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5da5bd8dc8646361e12915213310cb67254d4213ffa2734128885dde3478f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a9e521929329ce047e3385372dd99deab32a3fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c43a317f544a5f5921e22a86d9f7bfae4c2809bc7549b06d66aa39fd1745da2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cdcabe8a3eace150934608fbdea64a943073ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d011ce0356d9362ec7e5b183a29ecae3c7cef9addb5fefbbb784dac875193b76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27183e99ef9bb2a59b6a06979b77df3b110040d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264c225c1f5739b1f75d8ebb8f80e17474fec7a936896a2d7668171d2de647c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1610b1616b0263b0a5da24b3a9f896db762c2294 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fef291ff3e8f01360731ba16fbd6d16017cdf53277ed419faf661f5f60d21c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df95ab65cf6edfe693b0da45e0544c000ec5a71c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102b738f95790861289cfa384aa66d8b793843a12b6208a9a750c0533d2462e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35785d3da7454df77e64f3007098bc10d4ebd7cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39a72237e9e87dd414c441981eebf3390066faa41438ed1f523ddcf160cd7b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6a3ecc44891b346e4ffbd221f12baa383e2a47f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545b48d0478dac5d206055644247a87394e5f5cc6ca7e21927dcba17e0fec486 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2466de3b7a441794b61f6015a367b58cbe58d7d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5bd06340357946ece52bf744ac08aed3cf70b48ececedf7b4da83b7bc7c5628 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d2c56e39ddf4f9cbdc3d44367d1fdb8402bc01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45bbd2cc0514709d52109f49355a40a24427cbec854cd243bd508eac9762301 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4534bfcc891a4f8524ade9bc668515ab55863b86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daef0ff1e4d8ca805092f9affac9b41d077a337937dadfbd5276709c6e6f4feb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f84e74de45b525e2103deb0ee94fcd18cef8f92 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e88393744e3c601881f8dde3af68b5ded82a2112057c543c444cb37ba22c43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef1d058cab3e7864c16f6a9699d9c36decbe52c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8bdc0fccf144ed552e6dfe2d9e8bdcad137a6a1b672399df140bdd2a1e597c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5806f93130a3d1f4e5ebcc5356fd58351eb231cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b3719e317d9ddef5558ecc4baee295c34d3cb58761fcbfe14515f05054f75d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02100309bfde7aaa923f9f91af0afee840243166 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a6a606e4326b79ed8c6d872d5f7dc3e24c8cbc0e0d47f75b0cd6e6a34e4ee6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed59d5a591fc9da897f42600e61802f784ebe37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b27faeefd9f2018a2cc7a81cc2b711a684a3a5017c28ca9f7412546efff3868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e8773ee60bccc66505a28435aa66c0754770e12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417912d8800025243f9d12943fb5c47470e670a525656eded987ee763edb0acb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b717d67913cec0b369c8c5b8973b568cfd8b4129 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e00ab534e6a988c7e08a470b15af2ebafd4cd8b0d94b2f9cf599c121d6506786 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..748ce64bbf44023937e9a75ca5b36c05baf2b5dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0ea10b6c275994fd04c55905ea8e2f526f70209d2e115ddea69b49bdf62601 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cc19e542581da22f2ffd544a412ad08461f284f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3279b8ebbd3987bf1b1ca7455138dc4e268b5f960bb12982685b6cf7f753240 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a284402a1bc3ab1f4f8b317c287447c79fb99f26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f05a026ac1f89dc3ab5ba1abe262bfbffae9f0ff6202ce66f36e5cc41a710ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..795ec622cbb2f0f9ee6012cee80b05316fbd5327 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8a7347633576b2e14589197d16769869a8969893bb19db91b3c524d2410796 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b5b6690ddcb012401fb59982edfe8da246a6d63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2960966e93a9f4c32eebf9a93c6419a2a7cebc52ec770eef3577bcbf352471ee +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb0fc6d475df0d9aecbba5c213be6a8c2078291b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8e363bfcda57845187ea54e73e897f92d8280a009a2da0e3f5baa463885f08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0424af47625c8618faa666f59488dfa72463f6d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eebf67aa54b70417355a57eb644ff25c439a20f74e02e4215d259b9147f9ba0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0825d6e66dfa81d67b9f4c2c5270215d89234e13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d7e886008249319fe7b9866f5a808ddadb9158ab7540046881b0ccedc6e37c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82984f701703cc01112a29ab4d43d2b8a8a605ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca3f4ab887159a1a5f1e5baa395d8d255cffdadf6338904517fe75451845ad6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..711f2c225b54741bbdc93b1e78ee7601565625cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae37371c3a3722f29553c0ede22d3ed5835c334ad43189ee87b8635dc9963d80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd69f7f13766e406ee4c8d5aed0a45247b31fbe4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2b832e89fae21b6343498af78230df7bab77a2e1b72fa3bc3fb2c2d3c69bb2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0121618f88ea77bb97f039a1d5c5dbcc21c80a4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8498a3381d333e4033a1ba9bd83f1da854bd9c78171a15710f0c4be7d5b5864a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e8069523b0c8a819f20b0656bac0c9ee45cea0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9440ee38a2fcc3cf5c4af05b3a078be4b9be5be03d8f28966381e2d64b15685f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9a4705a3fb0d6cf809f9dfbb07d3bf3ee5c8e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a413ebbd3833f79f5b1ce2ce60e229ecf70c9793144e12b93b9f1abff7957b34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66b20f7bcdcf9c6274f4b866d41d5dd3f2e5de0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e833a4ef8480f50309771dba9475780fd5d4e2754ba7cd6ec5786ed9ebec42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..898d91372a40f044bcc4fcfcec261e55d1977b4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b434b127721959303523a8d48ba4bc6072a9d86de24ef0f6ef39f5f693981dee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e76d64093eab50067562ad221beed4f1ce71d01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0935a1b423666a99fc8ccd27871518e875609d35934316096b9a41145cd6f6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..434a4a376cb97ddde18c811a3a096b6f4bdea7b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e62b140c640bfc56edd452515aa11eb02c819eccdfd2974d71114f1cb6ae01be +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ab60db940fcd225eb03ff8f1c8960696ffa835 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9d6747ea3d1a22dac7bd13727c54b2282d22c952c03927031fbb114338ed40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32cd96d4ca838c02e5ae6c765eec21f7e3406565 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1c0827bad3ed89a5cd7014c470f7797b6d73c8605f4ac87b6c014c0dcf3304 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a84e44d540be66cb8bcb5a1b2f02e0b4a8262ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ea26c58a8e11e8ef2d5ad15295255ce29e88a6936dd5cf3b8996ef58333c82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a4227afa4272711c40406329cb734d5f7ff4b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef0b80309dcb8e40146db7ca8c3210042b1a4b46329bf12ae5f37d1fce4da12 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d7fb2cf6de1e7a30eea2a60913eea5be01a5ef4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af042a532da6a3f0e2884df338a6fe8cad0c231d0801f8303475fdea8f988b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caed8dbf587ceda78de4a1235656f3a44a45556a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be6670fd01218413f9fe34f01324726b9f46930432af8fdc2da3477d61b916a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a9a9067c38985df167a3441661aaa0c2a7a8278 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fa9b18b5db14a11364e9a98d497238e1c3eaadae9f6e15d5152172fce7b7b9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc5ac3a02076387161c3436c85b10f6c8552166 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5edbdde7652959ed760261900ed3424f6aac88eb09374d085d3a1aa3f270be4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62935ce9d96dad3f96254886d4f5a44af9f2bd8e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f730573694fee5d020f0bfb5bb3ec2a16d04877b4df441f69928beb73d05ee86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dcc33bb813b5cd8e111ca448340db408b44a6bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd18ad16442fd54608e28cf8bce830cd48d35dd505683315986208bcb6172fa9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..135b343dac026ce5291210e11531a808db08a71f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e475cb177192fd172a98a71b9d3112a6f830c96ce4ac5e875be971ec4d96417a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbafa6ac633f3c4b9e6e323e740bd46aed38cb75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7722403af3601aefdb781c16edcbbc23fbdf8cb634a475c4ac901b88eb68bc0b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27bcae1de9f7b41aa32973d0754ad347234eecec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7337bfb8e4d420a05373c576a8ffc7c6b4916add382c158474f574ae90294456 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cee9367508ec21ad266638c59089923aa4130be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99c202d1e726472e4854e6809d68d9078da3e781ae61b85275d77d4da5773ff +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e5fadf6926b551007e1a4a5f23d049bccc7742 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4875207ef0f88fd2304c1df7da36dac63fcc47771204bd281e64adb9364a9ff3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ffc2dad98c2a5bda8ea8611bfa7190e8f76b613 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee64947dc5997ae324a347c73fd392f1e3e2420798ad5b559fc1243136bae475 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0e45081a84f7708b969a2f1e8432f3ee3b9d0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf0e4b6d91c281d66cc9e67f2798e13af6c1e156843e6904fed4146ded37cd1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..885dbc4a60ec815da7a461ede313d46d9226bf17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2159403e9fb0899dd6dd69067d458b6a79fd9c3f8ed5d947ae2ec961de563b92 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f661d678d08bbfdb5a781e4f7139f416cc90cff9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27b5f2ac3819329f2d60e767db5df5475f12c2b005c8e061a381e9efa527c49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39eba8fb5f98c91934d621a9a374d800edda2e34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be649277225b51a88919ac90f75624d19145cfbafd22652ca24a119ecf339434 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd03b3e4d3fc4d673dbb71d7a2adef3ba8805651 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90ba5ad5eb82841972e57cf989e7d5cc522c484fcdd6e5a66446945dd6ba5976 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a142fd9e33fb12306bfc7895bf1b213994394b35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d396c5a8b746326d8accd558bbfad944b88182e6e725b1afe3913037b5eba5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf3261f2377c0751f473793b1f5e8d50b8a35c66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8b33f34a2e64e4c3e37b8b7466cc97148bdd3b7eb6d35163661e9b2d092621 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3726d941d4725ee81819359a5b222854f736272 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643c135ed3600489f619fe82b74f40baa1988dd7c34258faa594abdec7110e78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cc1f208bf587f03580bfe7d0e565976d124dbbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccdc8ab803b8ebbae48fc5c7d04da2caa736e567c9baa0986b8aa99d2a0bb654 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd812fdf8f527effc92e586c25bf358cfe2ae49b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d479c2d777686fe1ee0025c2a21215c118070ab2aef3332da3ab89742fb830fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abcb8835c8061a013a9a6b4f151fe33e971f6366 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873b6342ed014a84256fa00b2f446392698ed816d2a62093279315481b803536 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70decd08b64deb3bc8ba95568b8be9c7f24d143b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c03e2ee3d34816e34a1edfb69fced5c8c5fe5d9fb69965078285e10937e68e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da630d43f0fb49afdc7d68be8a9a54b206751a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0376902c066da21c0c0579b6aabc25a3682034856f50827b10d4872c1c903612 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18cd90a38d411840da10b42e4385d7e0fe3ac5a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15a863c309f39ee972cc896967c5315208ac752250b04ea34cbe10666042814 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e0fef950fb0a3670610a51af6f52b6dcc56833 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7bc4db737390aef984e0a0b3d997985d74f50096c4f44dc06407bc9a807070 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d49374b0af6779eedfdb6aaa8b06e3506652546b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81568698c7795759cb469991e3ed05b38910ada0788bdc45e3e5ca513688c99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d12d39295308ff34e81b6b06b7ec96b5cf83cc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9285638f9ea33dfc7b94aaeef86c07cd66f9a4f31ca0847741df45a307516cc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc28fc31c2674a0e9c683b391c4b96c12f857cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c313760bb24462ecd4df0f575c740dfaab926b42d031f8d3e693bdc46905d5c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca7c3aeaead31bc92719fe278b1a509b3527491d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2def1713d9ba5d9f235bca2b645a9f4e40ca2b800dc665637e6db3b60c49dfa4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..552fe41cebe183f0e6e64c48457cd904d0f0d7fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea7f8ac3ea83aede4f4eb87fedad640f6742e10d88d89c8fc2c4c313c374e2c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b739a06b11d2e9c98c2e7d741783b78c2844bd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e4ca3f1f52a699e3b05dfc932f1c7e95a3f882d7c0597fa2709ae53a23620f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c99d9133209d8412c33b1ba839a811261536cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04c6bade32da0bd034549d28a5f153440f07ea42cffae60385ea4acc3750a09 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..458df6f817b45de6096c3079ebe59f4ed2258b04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bece2eb4faa33b565776f3efea3f881459b3858e55eec7c33b2e9dc7b13fccc5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..654c10e4392a67f7f6996b0d71088af89d4fea7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634a28604ed1d1b154c9946c56d9173c0afdc4023a8bf190f33d03fd010b5c20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9e76bab160df342897824cc33b93c9383401b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35af4de7a36d61dfe728df74075fefa264404683f98d43a731dbb45edc4b41f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..806387c99d728ce6fa3b3cd94ef9a8b4c1698ca7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479301b60f221e690d16f152d69646575e5daeeac4513544cb69661eaa9a374a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9e0d4653f0c7d0f3040f0bef7f4ff3c2ec56bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0b706adfa6dd6fb6ed219c947cbc0f39d3cce6c6bd655e5c2fc822aea0f7c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb7bde77346c47192ecd203ca5d28deb4a5a8776 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb7a8b59dd8795e08fa306a8b0f58408b9c8c035adfc39dc522f47d991a9d84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90a4a265d2c21902f5a2d640e59e947fe69d8036 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88981fcf769720314ef92f09dc3c7c444d031a72364263d14f66d0183c44718b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..384641588eb7befab9c32ed9143594cfe02784a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e94d21c795aa9076bbad7aec0130700760d50b7c4c560ba6da4acfe1a16b57b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bf84ec8ab2562f07e244360a950b87acf67ad88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5f1bd903d33c1fdbea317030e4b2d5ebe0d0c24c5c98886af62e26039303ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18673493952e66d7004bae763927e534aca641b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a490e33772bf3dc7a4d686bc9504836e804d9938eb6fa42ddeaccd3b41ff18a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b26f0d7328ba986e60f5c1c03433852a8fef2eab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a7bddf4c3f794e82195f49c5e171b516ee973f6694d371f469054606b783cb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e76d69b39cc27a724d49770109bba5cf347830bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc5d6e0bf688f701242413d78c691089ef3ed321e102d4f7ee2c6331891eacf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d35bfb463a361c745eab9ff9c917faeee2a2fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2da7ec7d2ce3ea14d31171965f41b779212cbcfdcf6dc6bfd55b8ec9567d3e3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48a7e0ecae96d2e8fa79ecd42fb35cfa5fc0866 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f151db830619463599be4e375b4725be69599f7c7b440ccc191aa5c5b8c3c95a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0862235b9a97731155d5f94dfe1ea39bf1073886 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8370092185bdee710b48f120c1bf6f00780b90856b1c41054ba0b895aa06f986 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e12c94904b3c5d2dd9a2475ca1e1fe6eb101038 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6add5ba4bb3aec00b7c67c2748737e76cbaf97cc0beca75f406a38c3f1ed4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b2e85b120ce1709cf5e31051c828ae526d2b69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0489e204e5b6d16fc45b557b6a3d9580dece997b7dd3b7ff62880931a048a5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..914173011ffd20ab8eaca558cc0e66bdb92d33d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782902e040f04c9e05140557bda9e094f8f94594041520110cb66eae4a858937 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dec4c3acde4cdd83c518938e469a6f9c62a73dc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48d4600dc13e2fbd603f203a791236fe4f9bf21dd80bf6db92b45b0056e7696d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ef19e147c623f2701f10e9695f2651150b0cce4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b896439c77658a8cd52ac70321b699032073716764cfb0937bf28f5fdb7c92 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..494e915b73d301ec19fde024e0a6c6d178c36626 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f6c7c90e4de393e1d127dff34b4e7689c3da7eb4dcd5beb07f57913eaf5222 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de07ab993248b027d10c525a0965753cdd0ae4b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a64ffa541f3978a35bed545195c973991d0c5aad54e326a439fdeaf041d3a18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71d7f9c782fa5305c03a4594bcbba7978447f2e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5210fdcbaff64e39b3bbb2f7a25f0efa21d712e5b1095b7d29e404875526fc6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3adec844c40493786b8669ef230ef45cbd7c901f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7559e117401d4a3c5db7fefd6ae3fa15abd86fa991385b44bcf0d1e29bfa3152 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26ae8f629faeb9e680aa14e215641640654772bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ef09c37aa24af054d937887922325a1bf0744aa76795f5c1803fd1ea8f84d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd70dff0d0ec61a13c601a9efaa5e57c6a17920 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fba0c6ab2e7fcadbe04e713fae2ab635f850411673eafe88a8b360972e2cd58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c78c856ae11c63626b6ea05a27c9293bbab33a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62fb7c76fc7e97ee3009640c6560fdfc6db2cc8c666e983a801d5376a70428a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c13923458dfe4cd0d99eb182cebebc7a318de789 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778bb43abfdcee9fa1fa4500fb4ab90bf407e736ea496c13a8361ed63a02dc80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e7370d75a5163a69924dd6f5840248ca2efda8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e185c0c5641d2d07ed7ae75373d6798dd9c0070fe030dcd3cad4d3b8e7eb4b6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff55116838d57f2daab0f08ed181ed44f2a4afd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bebd570ff21005283d93d6d9e24ebf4e490c129382b1e916e51c5dabfe566b18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eee36954f99330c41c60d1d8dcd7f47bd458f25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261b85e33321717140fc044a0a7e72d2f6e3a10a7b5b458303a1783ef50e542f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0236e5c81fe2c606894583f0d87effceedd9d944 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd6a03b353d5ab22086fbffe6fc772179635736f9acf8abab3639331231b042 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bbe7f8fa2731f9cf30a29326ca81b8bd336cf7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d14b886754b4d008636312b4f6246765ed7f85e5e18e4a2c1448a5d568dce8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..faee5950f0402bdcd13a6432e7cfe0bb1a938095 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95b528ce3a89a39660b25e3bc4f315c67850cba58452a5fa03a47fe8a76a528 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5108f227f7ad6a965040fc2007a1f8940d05160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5023b8856543e5af16d24b17303870a6d4fd9bca4e8aa79e75b3a570e8081048 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a480b68cc398ac0e7580ed07e24a7ea985b27f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf731debcf4429bbca9fad457707b2626ec1944c8ab924c476d4d797a7e0e423 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c0b888e505ae7c40856c74bfe49264f5fb3e20d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76f0b9c3b2713e1d6d334cb5ba9331b54761ac54b8ce95b2c4dbb24abadd54e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..055a1636afcdecd9c0ec39c54a06ca2e0e5035d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c9085a61d64e3c5717f2407e4fd1e4fe6d91bfe06cc75f654ede190fafd9e6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25d7b6d55386e8b8d1d10747e4f5fb06ff0e071e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66cad3b98cd491c0aba4a631c2ebb13b355ec63faac9764bb8267e7d1e8cf06b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..298f19773934069c2baa00750d610b443e0e989f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c927f4de306a0ddc3b5b258dea76edf31baf7294b1658a0331419a07620f9ec +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0374c179aeb238b3ce37f08078fe2269f8b755 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79d1c6fbb072be11b6b69e97cbce149c0b65db00f6e2f5fedbb50813ea1f0e20 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e752ec0beab89ff17fd1c5019fce3c2a4d0d738c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0137a1b2653a0a475cae6281c7a3d9553b944f2455c6079279230c783f6d4f2e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a455656cde5d10b15c57cd2269b50d6cfa86a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a0dbb4b696d778d34adfe6c7b120334b6acb19d13d89e5f3592faec8048318 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1159a5c0285d54a6753107b66db221be511c406b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61faa4268a796082a9fc716cebb8f41bd7a93049a8998a9309a14d95e6501ce3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdeffbe48360184fa8af205755bc58be1ac909ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c9d911f23ae518b6511c2e66648940d10442a7cf46d31c4d349c84233d625e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b699a41154c63f8ff4e9f462a27c0bd911ff71b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf0444f422b707735b554417c37751f73bbdb932e34a40ae6522841c98006df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d6657245193d84b0f4f35d907c3b1450e0e16c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e893abf7405cfeb499d1a47df55685e66e619f9b08980cc515b90031853797c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbb10dea4238f4183be7596e7e03c938a114d831 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1818fd945adbc942eaf19a7b954fd64cebf961d0551b6e7862204937d019a73d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f9907b9390e0d364adaffb838dc8ff3f22ce74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddeb9defd3bf624e34c5d16bdbcf1f8dc339447eaa36a4ca46054f08d03427f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3cce950e954938f6f666ef93f229c2e8e951d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7434308bff1b69cb0902c5698d26911acf57811469084c048f695479ad4e53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc9684ddc94a85502f6efa66d680863ea6aefaf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c96f657ab8d0f5bc8848450ce77d17a9acc992d779a93ed18072636cd3de092 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21cee3ff1e73e618c42ad238e1afd053f93fde5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b10e186cc0217d44896f83bcf83c14eb815084e15f2fa893c17cd73641be08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80009d7d8344e2c766863ef218123fd8f5b39d44 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b83335df28c1f204eb798e8782f6efce6d059fb695a6841bde2139b52234915 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f441434dc11595d50d457b57e9ba652a1dcae24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec371fbcfd6591f87cc6ff02146e692fde814fa5780f4ed9684dc73cdc88f5f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15650fb2dd134c721af57ad8abf215be0a455a28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d542484a236e80f361486d28d97718091242142e8b77a5663b3985bfbe707d2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04ac7d60d8fc0db279e37edcd88f6e207891555 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590bf163eb989bc6e4e6a5f598b96a51cea5e86553383e9506dd9a9157d60c9d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec7d2afec3522e70703f4439d76adeb54083aaf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc4b9cf2a8a05a4074fb48fa6ac7f18a197c84142fdb760dbba2b0def7cc7bb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4a2325e2139395bd02c4611ff5d77192b77967 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22437a285949bed7b3f4195051cfe05e215703573e6aa66ad47555023fa8b8c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c52ec0f5c29be280a343e56b59bbf197c21c0ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade8916063e842e3990ea048e99535f8dd0715ebf47872666ff14e6cbfa22644 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4ad04d301c56110fc5f3f9b2eca514d3b1e01c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be0260e97c21b514bc4c9ebf37ed627ba4a28a3098409c051de1966be3e9418 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2ae69929841a937b4f508629ea9a4015c1db58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc4ae684b5cf11d21acbb4b1bfc66bcbd8054b74cd4468e0971cd3b4d8a2176 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e5b64a6f6fccbfb75dbbd2a73e61b0ff29ce98 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5db40c9627cdc1dbef667c18cf4c24d78ab29ba93652d1070217f153a352d781 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..700e3ecd1b8e4bd11f51926df23cbe50bd283c54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e2563a482e42cecb8c5688132333ca93750b41700eafd20eaf7a44dd9982bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a278a567db3116f699c4a7f1142ca5e0279248db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce3e94cad5f9d39dd47e34e1870854bfb36cd1c7f55cfe01f4298c84f6dcc63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84a099df710e0f5548a398d7d9d858cfa3c80a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7bc1797650ce506bd8fe3a745a7cbc1741a48d98da45b0ca3f5e62017db1fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3077db41054b432374c0f49147a3a33212f62ea4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f3f5116a3b3dd9f835aee489994a24085351a4d1c9070d41b475bbc076436a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96792cd1b622988e6eb14ac9a155720b9d2095d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840d6e57057121ef86961c654fbd60553e53052266a043d2a4ecdfac62d64e95 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1522885db33f588b8d287b062745e2ac1644b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2233c118cf603ea218d4adb0bc807764540d25fdb099567bc194c027eeec1fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32a9a246d758ce1f5bc13a7e64c760ef5ee6134c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f3d0020f32ca166d2470dd338b1ef1cd17d4e4a1c9dbf2933b826900845e90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8b39bc64417a80854bed1ee43f4889b4d0f10e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce39ea9f9e908d31fc87759dbc6b9386eb40a236a545338119ba3c77e9f244ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c742794ffbbdfcf1959ce2fc781c67a48d75cf33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd69147d1bd9abff071077bf12be408cfba316ac49818c4af275fe293c68110d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19f6ef05841348d808516b794e3658dbcfd60058 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68253b8bbd3fcc2b03bb9a828d211c5a4e4ce7950ae06ad5a99015616fc023f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c7e14ee4ab0988467c0334578d907660cb1353 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6c17949cd85898ae9f87dbf0557b96af832104d3921333ef6241f6894a1bc9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d55628e73d421dcbd620a68abd538562592ba40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d457472c55335aaa197c97264b9662e1e8833e4b6cf2001d92551fdeb7737564 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86dcd4b806e0c4bb7042b1df2b9fc568424b90b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe31c7c60f4021adb9e1a0417bba3fd1c70886f339509520943fe9de25a5481 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8715c9c45a0d6bdece6f56476e06e16b98cde632 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f1a3e05bf37c34d9b83fa47d3cad3e26a48990f13a2006b8a4ef36bd1eae0b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba03398322065b4d3a8f2819ef05a1758207e4f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b40c6a4f5ffcd92c8f3c7d40dd8fa6d6d026e721dddadf31b65f227deb9825d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63e6f3510855cdbd53985452d34920a80a8465ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7493b2012e0e12296b6103d84446ddfe2e8020b7724e5b3eb0966bad252d6dd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b233f5e36b14bb62d7c49a809452a8f2aca4ced8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7249a53e34c241880842af6dd2304e743f0b77fa5031484551a7a7987bdd413 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df5e6aaae29fa0e463804dee26e63b960ad92b0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dbb5526bd55c187e67a5926d4e72913c6fb85d63e6c58310919342c709307dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caac37145ad65dfa45f5f6311cc33f2f5cdee8aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09577a13deb5e99e7fc5386b37198738393a3fb12cfffcf50cb204f7541a500c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f234399eddc013e174253f0126d71339e028666 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f841251ce4ae12b3fc5d055de2f03abb87485ad0aefd2108e08cfb4b08dc6cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..946bf5b9cf5054330727458689230bb9e771e4d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4fdc8bb24212fe9a02471ebabc2489cf86f9c9aa145d71cb24104a941e7d42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d88d50f52e66ed5b2419bff124d5c385875c1afe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8729003661f7b1164f0fdc6a390a0f54d7abfefacee7683dffb4038a5082162 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..621c83545d36a84edcefe982fb3bd6cd3d390335 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b6b286bee840d3fda67f55b062726390a4f30b07b278c138e0597679259bc9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f10e335975966998c3aa9e4520ac7d727b9248eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:812b19c05fc046329364dd06f370978bfd70a6ff2f0a018957cdd009dfb535e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aadb841a567929440f3a5d486e7ee338b397806d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c76000e8a6f6f7389a94fa140a1e57f7a0f21bca5343ffe12722788875ae2d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..309e36b8ee9251f052f7bdc6125e6ec96d5c114d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52f5f1fe16cc8fc960ca1ef001ac40430d1f704fa1ae236da029fa70574d70d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9261b13310e7be364bfd1112382e14fa833733c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315dbe8abf048cd2115559a542b44c620dcbcedab17a793e0a92d21b436b5e49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a99eabd6df9ca1be75e5cb81553fb66cb7106f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2abb15b07ea108af44fee17aff437953f2354f2cef286f2b6add45dbdc1c86a6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57045e96e0a89185f2decb00f42aace00a48fcb9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db4ce0f286ba9a182aa9b220ddba9fac6c30db78c613d4abdc9260ca695b181 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c9f60509fb53bf09b263de28ac6771136f1e60c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a8d577a5a30c824c458228a72bc3d49056d0a921a8f10d8913a1aff43fbb69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb30a872c6ef1e78352ec8da92312f2b2e3142f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823fc6ac4817dfd76ce2becff6984493a22ad450849874d44a2e140d19224e76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b186f47f5fbc66cdf88bb2d2eb6ba6d0cefd4cf8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ca1ae4cdda6c9140db3c9cd1e53526bbc8a5a79f7350a7f7bc451009f0017f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d033f867e06a58183285ffb499af992d519d0e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f678a4d824aa69240cacdf3902e880391e9c6e61705a8dbe2918e67280be9776 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..955188da3fd00254657bbaa0e2a82d021dfd34fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0016dc2c27e7fb3873407d4a203c236c0a24822e8444b30875214f77049a24b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f440645a7e9f03298c642fe9da82d6a72a16d6c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5ecc745c3bae5a39d40ae40a68da35a11a646dc01c2a6044732a059a5c2bcd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8094d5fee0f2b2bc007587ca6b880804cc48846 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb31861a48d98222bab0c01fb09bcbd4375ee859489d90263670736712550d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b5e702e8d217696e23ebadd906216be3b483d08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248d42144f781b8e8774391b2275bac232742a8bc088efb24873fb66880fb259 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15a1f896b7f115e9268b74d43ea2832d2e616611 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927e0eb6da86e445048712096ace4c1d9423292270cbe63d3d9fc9c40182c638 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5361916156d4cb1c26e7c8140657221e6e8d51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7bfed79bb6cecdc256dfa5af26d4054262cdc0bc8d6e6d6e8f674f7ce0338b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba7229574e85aba865855eaa1a7f73d9496db77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630ea9e752374feac34443aadcc96132181806fec4a9049721c3933b5ac05fea +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..359cb7608acd50f547eb74f96e3f7066f735d499 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b1b72f1dc81f31b3f2229216335ebd7f91089721e244e3a3edc6fd96001c3f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd480c0bb137b8536e3c37503bce4f16ba6b1bdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f55b69015d3fa6b1a2da0313197245007e1aef055125bef85afa499283ddb69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae16d8a59061c550d7aeed8ccad7cc5be815140a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6d93319c56180e4e2e5d6be51d64366e478f79f38ca49e68d3e8cdfcd39cb9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52ceaa05cad60f478b03e65f4865c2a4fc9b06ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3843ffa2bfb8e56b5d9326f0ba809a4156e3cdc35549a0c11982321c821de1da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e98a16e602625bd868132e13ed21a6d0d74933 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cf965d8179c56a36e43a8c55b359d0efb22fb1871f99a569759dcb283030304 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e2d32dc85b4b6c2d77911e5a88b9879bcbd7a62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1dd692b7e5ff16521410e4bc8fdcfa5d63adadae6d9544c3f8c22fb624bec4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..548b3503a51dc9e5b743191f1e8a7dbe721ba291 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8341390c236191503a1f1040168f5302d32a3ac3517cf14210153658908aa98 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f35df85ba23b1def3804088e3f0b1ff4b57cc0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c315880417a494486fd0eb29b75a4b8722ff4c92742005af64472f27593732c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..896d19f8ab0299aba4cbb7069cd9955e2d667c73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2efe6c679c1d034d34c2790a465a41c142b1e844c9ddb2de51706cdb4b77ee78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f32f2e41be9114358ee96079408c2de178a40eb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c745fa8a92c7403dd278d7a1f27db674baf9953fcc6b1190100990f9d68b508 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..241b55c2bcabcca0e780d99bad6c5e98a03c7c92 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fcbdcc70748c6bea7f2e34051448c8412089385e4f5b35b8c8340b3cef0137e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4d8c60ea11e67d75b7f80c22731f5c09f2f3502 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6219ca0f1cb1a47ec9b72a44323a412edd54f4d0f5a2adb90b6b510697729404 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d2837ddd74b1580ee71a0d2bdcae1517f2536e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f5317d77daa8edac455f43b81ee7eeffcdaf46fc3c5f13a188c0b20bf2fd12c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c428c0cca79c96190aeb776be4ac399dff2a206c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed97e1b38ad85307b3718a1ee101309b60db27d6722008663b417bf99b50e491 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bed566fdbcdc0a33a05f6078b975c9ae9bdcbcc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f401dbf9de62e005dd69e9349b53ef3b6476f77b1c351fe1b907b016d4247b4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e58b414ba66175df1bc394db3f8482b7ca252bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f98510d61a535574bfe9fd4b932a447b616d820f015e1b2afbcee7116cc074 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..680afab56758eafa90c6327f5d76664920ce5ce1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ba595304db129cf38261ce25a55db68309f5d7b28f25777fba99296bf2fd3d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40099a539f166fe8e02fb9fed8c392d73f0c6126 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58341d9cb9fe9539d7bbf55703ef9e32c82b7476ed2abc7df6874774f46c6810 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..101a4da74eed9301760e4662cf829bebc1a5b936 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815b49920ebb745fe4840c8c469072fd5011479d780df94abfbbde19e5409f3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6949c84168361c8237607c8d234a68b2e224628 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbe86e0895d247bc524ce36607179428723c7c74a38302e56d63bf0a9976bb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e4be1dbdf2d1b8dbf83d00ff0edf5e6e693d663 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9565878e80b73e5beb3c1d56c27ec401a5065610852b8e2a100cbe148aafd61a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ce4bd72308abf53a7da525b169f5a6c925cd1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fc5b089a5cb2dd6d95a838c47817d3bb1127dd0e1953cd30eb918f678629687 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5415a6e6f01d3a9b0b47fc7c23ecc956a7e07be1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb7576f9fe0eb64ebbdf0655c27d798304b7cf3578f9c7ae08e195a8f5dca14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b4989603e49bb73d80775283c6ea6a9ff31358 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dad3870adb78e6d56fbf1adc33bc82677541c06f5dab5932606ba93afa248f5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15199dce07bfa298fad34ed70d6c077c7cb21592 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c9f44922311b1117d5d39c82ae560f11e61cfceea30928a06869813c8a4930 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d150234b25f2e8a4c2b77413c2dc9cefd6fc62d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278f7887fa6c78e4cde7b12ebe0015a8595f3f5922770ddc471f74e773ed6422 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f31fe92dfde440dc96d25f563dcbb0ab1d5b41e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5b26d63df01acbddc86b02af26b79cc500c4adf0a3c13805bd79618b16f243 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec92b22750cead7fcb21ba45b222afd716a01d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff3b48d3155e58396a023d93356294a25f211c53661a85256795c3c1c1a90ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a646792c023df48db1f3640308bbeccad9600db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db476803c66da7bb83996cc07f21e436d1867704f75986089de34e60d4d452e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5e7d08f150d1efd661fdb66da1eef8f6956873 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e47d54b70d71d1873d640d424f13ed769dcd5322b4082718e91f9ea67d8aecc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79fa4182a95ecf2fed12b56045f0ee7fbf465010 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07dd4927c41a30a85247134efa029410ed598e6c496507bcd3fe5b2e7896ef4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a958a3b9fd45308052d1dc7f6c130e0615e4c6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f7111f677db1ffd84d04f99c63934d6606e989825fd0c8aec9bbc4233d0535 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d0d5aafac75be3b48980d8c97d7f44f93161a45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114caf2f41a393f1527ff0dc135d307993093c9c7a393446184597bc6f1b03d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c05d8a875bf2acb1803549f961334fbb583e505 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f154410f6388600ad81cb9910269991b6f73cb19b8cece347173295d0051d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd7caaa20e9500d0d4030418c416ea45f95ccde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554974f24c92fb399a7ecca0a9a7f3daba8b50324afde5413a24eb17ddb51e4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ae0947ab4eafdd76a280c9c3e058bfb96aedf8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc4b9ffa02b7afeaf028caa953b5a83840f26c98fee5c409182565f7021bc16 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e89fc90c4b298cc9908fc7853791a0f04d5aaa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97f8f7bda67adeb340a5a3601dada074af81b2c380084227346b8700f302813 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c5d4c12632ccd3174b1d264d55e64e24f2d51e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723c20d5669ac8e105287bae7c724f18ebe413c16ec6db9c9e41be1956d7f757 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a8e7420061db95bf36cff49a155d1b97b8bae5d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:208d16116ad0db812ad4483443c0f8fd921478719cea3213d8bfbf885de7f061 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b277caa0e8753c7ea93f85f996344f10fd734a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806ee3786f6b1abd5644bfc2d4462375f98a4ffd4170f2d0379eda3dc540b601 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec95c9eb6e1527621f2a63e7191264b48cc3c721 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0dd3ebf430ced325428d491db63d99f94abb2092d1f567706920b9f18c9f8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ac222bf77d8a0e94cc49e0dc72cb506a9b0547 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bac81eaed67f5b88955576e49e301a6ef6867d3caacf7c4eb54d85d8aae32e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da36031af29df03b847a3338a3f5a11852b0109a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3865746a83d40e2bb8fa4926e7cf375c768407054004467e88e433a3137a9398 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9155744cc2c917ad68b8722491b7398016b21bcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04f13b57c079b7a6ee9abe35f28f5ad23d8e86189a4babb8f5eb5e69eda4057e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ff11e8a6a3656191b2043f24f4ff9e3a068e2b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6efb9f9229c611f2afec343b4ae0dbd67cf1bfa909c9831c21d90485ec43e07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..676d24e6c19d815ef421f56910b2d02d1be3fc08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce309d57e93d5c790e207d2ca4ea5f39f412a3f0c69171d69e72a8a3c30a99aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b027aa1910c0432c4e7c02d0d1bf5e06809321ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6e61dc4d14e4538676e6dae92b78eb4eafafaa0318e7ed28f7a03181f00ffe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a668e43eacad464be3452b600c59ac9b4c1de570 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c62c07334e48bb4dd109a3f5804b95c155b0142986c0d57bf71e9e6bf7c84f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..069a83e85abb8193d904fdbbe520747bda750494 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ab80b288a00cff74132d39f2e3febf95cb14e305aa2748c325df83c687deca +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..487ecbc984a0c1240e3c6926d8bee31c38db0241 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb619c650bacd49510e3c45de966401b7c41f8c38259fbde73c1c6ac7da584a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b97fe6449b40b140843f6165d98f6c4780d42c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fbad0ab314ca0e1bce45e413789b7bf9c19bbdf6f1adfdf228542aa3cfc7a46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ccabe5abd4787d15ff53dcff022b80c64fd93d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce40c56628fbde20f7b98ef114b41710efbf23fb94f652f5861e6ff94474806 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a86a18ac2765a7be8e21254359b5852da56a2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f0a0e6f00732e9ce01dd22cf98ab61820ea1ccbf6c6723799c4f4a28f527d9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d539fa21eb60e139507ee27692dace7c0286f0f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23577efc49b89ef59e47b680fc33e1b622dc7818f0817644c0fb5799208ff732 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f7db0f87e1ea1c2a49b9b2f251986aaa30f0010 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70cfb1f9878051ba33752c9c02840b4b6d0905cfeab79326a4d4a97b9d41eb1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b18625f86ab0fe8c59d264a548b0df09380da3e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:567daf0b4f244fe66d254e95405fa7f349e136eb3844569a92a2f996fb28a3f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..116299acdc42acdef322674c65b86ab400d92b52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c29f289da7091c79c7ec310cd56e2fb78325f82fbd391b8b4761c4e786863b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0db2583a13d944adc439995dfc1bcaaa07b18873 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa9fb3d6b76973b070f1f4e12be9f97d93b3af7bd94d2484b95f189c2bc6f9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2073324363863cc97d99979afafb02dbfb2706e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68808bf78bfa1139e95e8bd7755b28d48cab15236af52cd88679738cbc37e0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74810dbd8b5b82604b4892c0a285c5b74304ffcc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00c4448a13e0abd8587e710985b306955f6aa0b956e8ade37c9b646ccae85e0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3ce59dd961d727fcd0c46f576dbbdc06b67ad9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce190951d3638bbd06cea7ee9f9b8514cace6f431e4eb601ccaab31ffee9c142 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9420e4f0fa91c24602bd146f4e8cb7050461c52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b1aff0cb70a0cc4748aa9ac08596de592c9d952eabe5a256b35d73a5c1155e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f369f9b90e7df6fdaad065ca07a6e9cf7b9f2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe7dcafcf9c4f14332da82dee01923e76456396876cf8286ad363baebb41b77 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4f95ebbf208acdb96985acd78fb09c34b53c915 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df801365d347822996e370ed84d0a5e96ff496a19c49e6622783369f6d9a137 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71a9ec5ccb6c129b7f8647c64ff10df92365a06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dfe10b32391442bfa1c25683e46def2b8961fe003a69a4b7771be066a11098 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f97a13a2164dfd9586973e7b80ec581408768b19 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b896b7acc9ed9bd3febe596d9e2ccd6f60872eb69c4973cabbc550db90d4bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fcd143c188a2680a39ae83555f23f8a2a8abc9c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37617475fcecf0469e14df24f2d4d34d01ac6f2152a4f0f63418b5e2bcdbd044 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56c44033d79d056ca58f8e35ea893a8cdd046a4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e4611fdff3ec3b03661b1be23b20f0dd1dae9edb4f6f20c14416550467d146 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b20ec41fd9428fccc30154afdd27e7d8dfde22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966bfd13240f57df2ba5ddd46ba615b7f7bfc4075de4604a1e844ed25c778abf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37bb018d4c18d6b4a48191fd91349a2ed61f06f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ec18d519dbab9ce2491aa0e332ba098a94e13da1263e5726c869e546fc53ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..599db63e7de3c111b7aab54ece1e1c6cb091e6ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0af3d109d7c16b01b7802c198bf04208edce63239582daf7ea3bef839348b5f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..189311ffe7695293e893512ac6b6244638f88cbe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:119097e9387d861577de4a982ffd7928e2e7fc36f803c3d4c4f959c192ea90e6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c3157fbfa869a1d905d2c7556d16201614e5f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e926589aec344c987746a41a36d28b6385760c00495dbc274c1cc9f7e46332e8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acc8b4a118263c07b4f302821d459bab5ba4c212 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325c206d4d8098866bb921e9f5a09336c76a24e69b7ac47f61805761e1ccec51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab71ce1c9892b5fc4bcc4ae394c98fca9dcbefb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939a563c4e8cb2f3cf4dc46699512ff7651d66c33a45a1d86130385aa163ea17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9d0d831f89e4da085ac2f075cf594965bdce63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948119d3d325b3777d8c348350f6989a3878f4a826ca4f5b520db19a4092f7de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..029a6501c36160c572d0d717cc9d74d5bd183788 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5ea703a0ea2b5926b56b6bde28eac018f0b95ee281d48a957360e89f6ab341 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27c2cfed36ca51fa89e72da4780a284abf945436 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf23e4b3e4e3e2bdcada300baf99955f49e490c18d151b054122bd5afad98d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7fcffefa7a7bc8a626b6923b739d2d599b8c93a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308d5ee86305e723f000779e4e00bac0b3cb44461bf1c490d2d7158c016fda9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0e263006a949e315077c372cddaa7b8d391e0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f5cf2eb31aba373c2c82af758baf8a7c5fc213e2bca8d5eff4f7326f485bb1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6389c10630da958e1330d10e808d9410c219ddbf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c970c87076df24e9c184d65b5a0e4cd725320befed81c11e3b1d7d891f7c0ee0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c758cd5146e016a09488ef2b90b92af8a90bf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6941c6fce0a9af3935070b2fe020acb6b3ddded7a067116abde702fad73d3d3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8bbd6f391f51d295e050d02faea1ed8422bd9cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09f530aabb65afb73d1c48d66c07d630b35937513a4fbbe6661007d1c65bc09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5eb0d1393f0ac7dde71a3ed019462744ca78e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6444312a4773c85789f53ddd33fbaf906dd58ff51d4731ccfa4ef0d08f2197 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7bb79516a0e382c0a8a4cb96e7bc50d69e37017 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526f69a6d5bb4998f3eb46d2ad7fb527d8f79e802351fc766508e9fb29a28e6c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f9fd4c980dd81c167dfe82ae7c191ead746149 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30e1b42965fe87e039cde2f7d68e884da44a99a0f9eb6eb09ef78a7a28c5acd8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1969181a8d2f3a7965fd659bb16d61e629eaa0a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e99880ea70b83f5b7a75f325e8c3935bb9121bef84f2b6dcd5456106bbbe2823 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e9d41979e3671103bc3d899c72f57c870b5a4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5743cdb576399bcdec6b0bc7d6c33aebb044c271df3c2fcd83391371f210ae7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b153cac1af0df7ba3a41e02d927cfa744a7daa0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e83ccebf806058312e50c8768379549f703222179c5fef2c3f593fb7bef7674 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b7bc035c31969a6f34bfe1b39c36cf62cc1ce94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:184256e1596c7a89b4b0c11a575793fd36d0d6166b69492d09f9a9fb7026d636 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..782ea21c15f6e9891d46c1927eb15d6d828ad2f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8a8fb5f2ce5c7982d7b8ae511fba73fcf42e900a0492736e5af32d12cbc867 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9338375226296903d4c05c41d574760dfe590c58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ac2b96a8948fd106c5e762e8188b34d12f053b3015094cc0996ea81c662047 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de06d189d73e9560c4e78bb4d5256fffd17fa344 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3392b756f7ab99b81be59c607360a99489810dc1ede8e6a601f9f7d56e33d72d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb679e6478fe0e71898ed861d14bc95d3a8a18c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c1c9d93f290b323c612c3b8c39fd8181389c14fb866bfd6ee7df51910baf38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..032052a659b083472755164221a4d3f553e4cbbe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c31e69650c3e397f0f565a7056a97ad038ba1393c52b7f2bd18d1162e7c9ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b6ef4a75936906edfcb1c7005d9bc5a6c5512a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753d1bf9562b273622a48c601435939d74689663b9fee28134190c41af206ecc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bb67921013442b355f2c24613c7699aeff1b73d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe4034983cad16d5e7f76ab4337e0255c213d6989d48dd6ae7454f0e9a647b7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a5a562fafc4e3c7d9764254f6b7a50cd3ae675 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f906563ce35c7cd904133a1bac6d2c227ab08d60d9f65ff4c95dd701a18f3cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2563a3c7f97ad2914d4d2039b45d7a72f8d2c05b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f2b9bfeb9698450e0c2a67f5f1b06ff5036afd5a8ea4e29e6aec46f2afd34f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e91c9b5b4d62dba973258c4bc0c122139e066e16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2b51131e337b232de0a710e8c3c5287944cbe2d7c2721d0a69c7019ca8460c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8293cd65a068af6e538567f87a3bca3b8f0868b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f63800c4e8b22ceec09ad385ce71668b86a2351b3863f7aaeafff4cf3adb9c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea6a4a9e9e34623fc315cefbfa138abf54e79d5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2376484a73975bd2a035e345146c9c0a2543eebddcefd17fab81780f69a36f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..107232ab94b65bb9e7a1d582b5f9f08c502ea619 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ce85ded9444bea603417865ce71c5a086f5b921feda31d801cc56f02912ebe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f9f4b5122c2ac297f4687d8b08f1450c41fde44 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e0ce71006e8ded155c0aa0ea9d9dec5d3d8b424daaeabf3b4f6a85b07aac08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbd0592cf195d6c8083ab2ce95e77f542bd2fde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f81906666b0dd51e69c2e0c3f4f76b330287baac16dc349a86f639ec167c1b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3696748e961b90cd737f357c05c07ff41ab8a28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50396d2b5c32796826599b123d4c8f59882923ea2c4e0bde4bca17a41862108d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6181f6db73a4b2bd3e947498ced16cb3f635963f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f238f4fc10d3c4dbc71b3b42925cb7aab2aee8b1775f8538d540730ef1d3d6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf7381d0ea068b41095c3a5a5d67d7c46bb3975 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830bacf3aaff4f3788c243a38207e5a93d9a3edd20907aa3c837e7bbb9738fc9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fe95287b1a505c88cc70fe3bdce46a8801ec5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c89aefe5ff6f58f9636d5ec8606dc0c0fe2a6aa25e57bf8d19ed815951fef3d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c924d03d68acbccc86b62a9cd87ce94f3588a98 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb9eec7dd5c1cbed3413614dcc20c870476f9c0a5eb3f6039ece66989ca95e98 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97596a1780b88e53a24085a7fe176db5b029b848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750675d5766d057977ffd3a38b36059db679449ead6ce45d4c5039045a81f58e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52fc91e9a532bdd45bd0015a912ece095ff99d0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b32ace8af9da46860d8fb1a95e066eedce0ffdb3f19d29fab066ba4ac9c661 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fbf26b787df6a0c6dd729d1e1fb18e8c7ec2b8f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3dba9155f8b64b9fa527f4109648e6c71b1cb111d92d0e18d79356e4831a85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b518f392887c833425c962d33c6bd89083c923 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861f600de4869e047b0c517bb86a80c4edd4651247061ba5cd142c25e5950320 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31267c177ca2f99dce470c665ab9e616eb2bcc9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af85b86a82a3ac9cff9adbbee0ba5d1d6586c212b26067e0cd29e6cfc9a1271 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf2bdcdbdf337aafb12a4fc2b2a5f81cc675697 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4638689112715b998737d4ea506b0a619649a6abfc4152fddb0862d648120427 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af19cf84783934771788e897d879667151e479d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d968e8f87fc35320b4961d0da710139752211734ac264a251b6b1d9a3aaf60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ed212342b6f37a53839e582623d2732d3eb42fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46782639dc5968361ef960fdd84fbd8df2915edb1bde7bdd8be295fa47874442 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..405a1a0ed7c604f63a196e0b4a2126022ad2b5b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e863806b9dc77a31e89556456db0b94fb10d722c8e6769e1574ae7aea103768b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78ed2fdbac6babce6f2ef38cbc11b411f3806ea6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0589419a9ccbff9812360e3943b63cf7df45ea1679bf9be7dc21043b121f91 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2131e9cd73843da8f9b5c43986bb6446cab6fb80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5cd5e0913e762a9290e09fb0cc9dad148c2d53f17f0e8f8214d3cfb3e3c664 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb87ad0f1c2a5e08d8ad3ca3b5e11689799e5259 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8141487369fbb4be44581fbff384f64fef270cf5114c52b0b0065d3bb3613c4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..541a25cca5253cf37ec1e14735c42a99f240e66a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8879ebda53d511accb1682f40a385d662312f7c89923b786d66210f9286f3a04 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c9f00a3d750f6559b19fbc199a8b4c99af6560 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067a21cfc6821f4673adec27514246898db96b96909e5c77bede4d2d0506db75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..906ef565d1a03c1ce48c9660d5a49c2664401dea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a4c86c68ae9e71c742c80a04afc816ef5ebbbe9ca7c8be3a89ccddf91c6898 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3919d9a3d864a65e683e3da8b19736e1140d9c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab55da8bc2ac7a1f42b514768e3eae33e85c75cd4ac87f48479310d45f3e3c5b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d063b4df32fbc1c40e96899e3b57bd4a6072a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b05c37909b0eef2ad8044eda474e6330cad31528e22a2faccfee8fbc5256ec2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf83d36266d2ba75c550d7641b5e4acb995feddd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1ec08b069b9ba13d59bbcbb23767655cc85d52361d2d8316996953dce94915 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..533c828baa769bc2f754638790d48bfdda637368 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5b1923c84dd9d488eeb14b533bf88ed979c0909f0a30ba8b92eb54d3803aa3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..052a7954e99942ca0a2c8b758ed9ff4f9570358e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7183f32a3c1190e420a9e677f458c1d4bb7aab0b34d95e49ee918f6b450939ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71170233c2694ab24dd9b36a0a96ce935e8407db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d8b0a06bfe15f987d224b2539245a1077bc1bb51d7fa089589f7019c7f7653 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79cbd97896cd92618adacb65852ef158b7e8601 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a9f5597b7cd397e55ace7571b7b3ba48bcf72eb37e4c24579f2ac8f326b2bf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d760a887e36711d48ca4d05eefdf26c68950dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9852850500305ddd27e18243418178fca1ad595acb4773da9557efa8a1adf181 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3fdd8426517eaf4bfcc702aad03d86e6ae5ddfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afcd9fb5664b7f4f82f8b15d7ded7cbb11600e73e475280d149ae5e5b4e3b5d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4024016e2e7a2e06503c3460acea82762f457c58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7486d29fa6a6e9b9df91286215ed7c4d56d30f1bd8d0149c3ed1a05ab86972 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f3cb86cda5b471c5b9389fbe4c47305327fea8e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edc384b2a7a897693a4929458425dbd65fdb0a9ef8519d2abf0043ca27b3ff7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4977572fd2733ea7fcc778fa8154f832a0d64a46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbeafeb875e39fb9515cfae1cf8c535e773d426199099464d26053cd0897cbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67c67986859ef770b8be4b80bf12463b2923011e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc645667dd7487670a72c3dea72a4c4c577fe45779c1f40a9692aae9bd6b645 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb28504ca242ee231e783f1854e912246925dac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e85e9086f876f08225aeb31563ff8d9e9fc756f8033acb7369da19306257f96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..875b1ef2454b97361b2ee24068bab0be47a4395b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4dd16b12f075881d4a3c49769acc1269feb292d222feeb4ea90dfbdc053726 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34939bcf5e1c48d95cf1f047239e9939ec583edc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0350433d539e1ca7ff38a9329472914712d25ef10fbc159de51f480fefea04b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbe9db0dbd6352c0b08d3ebd827102cb6cf2e828 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24195d81ee34a5de423f27b141f8cfa83e926a0208707f2ddf0c3836944f093f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97a457e1a43efca62adc8df07adef8e1dbb1ab66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccfe7ac95185d9f8d69d0d8a6bdc1834f2962d3fc7d52e7d7301a331ac8c4b4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41593fe47f5bee8d8e693b66e4000ce9e85ac2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e5e898e22c6ab03bea1d33dc0b5d7263b8fed0c5446e85bf582f0b64ee738f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c1011735feae648a06ed37c557c223c3e7b5389 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987494e40b506d65f2442ef0d0bf121f14d1cbc4b5b5b2242b67c5444d3f921a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b59b9879485a818f49dc5514ddaebef078389c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138865df667008777c858d1b05b98c4c4c3ce38c6e9d299e9bef25c0afc5a08e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01838f211dfc1ee1046b006b1b59c6cfd16b986 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781ebfe00adfc2452292b20762b394e69305e30d1412d691df28d9635a05932c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7ff9effcc36ec8c8f37612d033cf5a53eb551d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62df65ebf03bb58955aa425bcf2e77b00dea8d95e128ac9b3446d474f40416f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadc370b379699b0ddb946342dc66e48eb79ea24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f5bd429db707c7fcb56ebf98bc0be4d93e0df8f765a4709cc9d68dffaf8cf4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5ac7ea93bc4d2ae05dcab32b2592c6d0e2962e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f45a98587fc1ae056e572508455a059a6969db613268fdbcab90de19d75755e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a37c915ffb42cfe10ee95b0e540fcd55587f73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640c73a9fc962c587f8ae85dc76e488a68f7d2b382eaca3ca756cc2025b4e75b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab1912f3115da76bbe337a1bddf9d79e744c337 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0443d06f9c709a3219a2b55b5a2ff7c60c8bf1499e48c88922100df6ae911dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a69e778c0ef54dd9f489f5330590885f703566ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5feee665ca435f77e99fe365ce09e66b768c732222c6bad3d69f2efd81021763 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57fe5cca6c4583ffd103d15684bc7cdd0127703e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:301f6cb75bbe383970a697e014b196999c5db623b726feb574bc610c7ca075ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa5ac47710dce866797cc86ffea4ba0fce360051 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc0b7903e1c78b0b3531e247957fbe08d900eb09008fa6ff1a0dffcda784a511 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16c16ecc9982160fd216c48c4105ffa7366f0d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850b255aef00023c824d9ccb9fd573a12048ec8a04d3a1b0f8b67871087c3bd2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5fb326351a56908fc83bead6dc9e47d574a5e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe43879b3fdb7cc17dbab07534dfcff5ddaefd47b27c4b20fee77d4df517d047 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2ba2813ab1c2478c089384c8d966f73c7b040d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143b1dc4ddff91fcbeee062009cbec676a05aae8f66e4e1e99647ab0f3937e79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7958026e90da0ea6bcef0d98f6ab8e8034a29d4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec89ac61c6dee047028f83d81db841cf54e24285bb80dd56536428b482d4f7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50ccda7d183bbabe52d38ff1a59ea5c11d82bc91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4223d7390dca8c2d434860e0a9c8b5053965a5a1acc60643ce987de0b1978a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21d0b423a03396b68710dd377488277c4be986ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec45ccb2b0eb6a483c6fe0aeac9bff25c2531d74df9bc0897f64608a2a9bfcef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71adbda82d42dc67f636647181b3bd97474902d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:debdab5ae572bd379204245764fef777e2db7b8eea27e779a815a890db7e6100 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..072ad91e22fba25d84158648291a1e5a2b265edb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b483452a9bd8e05ceee627b7593472a6883fbf45231a6e687d7d465cde510a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f72269d67e8381d45ba1bf827a7d5b347863cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e2fcdbfa4947acf3de3f7172892e62679734cbba6621e0aa8018015c151c4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65deaf8f6ea65f885e35e49d5b6abfd2e60a0dd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1336875d21f92db2ac4a61eb3d9abc3a0856946b1a4048261a965f905d899a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d06d38f720df5e0d571a68a2c33ed507c2a76b96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6d464c3f1679e6ea646adc9ea201494d15b57bf0ba3c495242736e54104853 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6debdbff3e46c482c7b9fed947ee3780835ef55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ecd7000150ced99c548417e784aa81ed98766197035c1bfc868a7fe8883264 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e21cba2c3833e9d9ad7e1ab04d899723b9152f85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42511aaebfc4e5da21847ec1a44b50b5f1fc862ad7a89793f994ad201070bb28 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44b83fae440311d37ef5a4a3fde2d3f791d3b1b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3139199a52b5bc2ad983876f73a4def5c5a90a12ca41ae0ebb7dae2eded119bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5654cd804c3e89f1f696a53c9bf4068d27bb6c40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d441a65d8eadafaec44c36eada76747f6d8f5c328a1aa7588d052eaad0470da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16cac4e07ca770c3a74b9594de80c5188dfb615 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c2cda4cb638ad289f0fb6f80fc4387e066bec83d3072e76bdb8492f5aca6f56 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db8ee909368e68b0c1c8e3885e11b3b133e91f04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3b60405c250da21976ea25defc588f9ce398a2150f681fb55443835044c741 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20954bd0cfda46e179cbbd84efe20712362185e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f328b20422343b0872bdc94da4c36c35668c1832da1f7626c89c6f6047920568 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..746cee2c130a833bd2a04c779c72158c564086a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4722471fd4639fcc04af1b57f3668f0b237bdfc29d412cfaa9c325334385021 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bea9b1a04d81b9af0deddc3e856ae7f0b5a724ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6b26dbb2de43c3da641a3dabc933510e4cde429dc1b0e71320038dfb96e530 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..910711ccac4a8f60b0516542beaeebb1ea376e63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068b5ba733f03e0ce8f8ce137601e5194a7917b52dc4684143d253d71f851c76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa1117adf87dba61fc0f7461924177b692e94a48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21d386d52f96a4696d8dd728fcd041e6eb776d30f4ec5adfa72d5b6ca69898e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0053c5fe8e1a45ecac41f0e57603f66c58d07c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1707252383489b7e62a5718112ebf748cbf33f1ffb1e2e639e299df0108dbca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..422076fa690ead631ef5871ea2f6039b111ba50f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c0163a0a76f18484774d7e7aa9f925e9b6017fba844e474751451f07dfa997 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ccfd4ae613cb48265c4809d4fe1bb7fc1e666e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd577ff441360612e28390fced012e95e7abcf05e1e15c5a62ad6a735eeb3bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96748386dda4e260deb9c865c49c62d773b4b86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba949c04c429270497cd4eaad7796497550a2984c7be9658ec7b3d3cc8d40949 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f860d83510672e1eabdff096d741c2f5f7e2336d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41cbc2ba21cfd652e989bf2123be27e0138556aca985f6f64cec59fa5ff0a320 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab30674bf2b381a02881908843a9e6d79f4c260d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2437e2dda623661905ba40c82d64c2bbd32bcfb0e49dcb8bc0c011ff01d1869 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c8235b31d5f198835700b24f1f7ad18c5d73f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23bd2240cdd2cbdf6ac43d3dbffc68ca50bb217154244403e70c7be7be960935 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c95d2413a0e805e2baa357331d108fd5cd2f41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a645b5ca52bd876cddd656804d2bc7b93520f7021a755c30a26af24c91271868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..028108770c51d5901a328f9b0e90afee98e9b744 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89dc22fa2c402739bbf90b772de95b9ac7acc3ba1c262b05b5a9ae86c682c2fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f64fc0ca9d7ac5c232b1b07093c299ff88e355bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628aa925212020156fc05237c90583718b08d7e4945aa5e0eb42c50864a6d3b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..961d53f8df721e564e1af02973d2b7aa4c8f4d62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e1daf5606a2bb336bfb60e02ba1e054b65e12c04dfdc7a167d33954c7b870c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf75caadcde005662d741519bf91976b7900fe53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cfe631cb6eef0531caecc3e05f0a18bb5cc13c76fca8703ffab360537a59c2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dff855aaece31350c2491ff00c7b491c604a87f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d53a452467d7566d3ccf308bf7f36facf66750d33cbfd05e139603b49ccf3ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe618f981b042f409a7c55545677bc12eb2624a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff80f852128a5e99ced97d6ff970b69da91296d4da2a706b1e068c625d9773c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf43461569892cd82fb5cb77f4637bf9d7ed11c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c92388d72f32c66ed997461a26b750e70464dc0f066b6f3a5e47fa83535da9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44380e264994d82d8c15f6255442333cc2e6811 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eeebdbf9ecba5bd5bbf7f054497681478dc4712e92c4430956604886aef8e42 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8877f4d9a3a95dcdd740e90d2832e586a25a3f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b781a628fd97e7b82d5873dc794d1d55842e1aa1009096270bedfc2e001e1121 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea945e07fd711c346ac3b32a907f77741247a950 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db9535d2750912a2d28f5cf5fb7750c74c6aa2e8577a4419d79c48cf65e754b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3bed2119aa989a09a5a737314e1db544161a43d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:596d73e97bf010478cb98dd2ebb766893c635023ef8b65b79de3dc3eb125bae3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7b5843a3bcef9417188e756e5fea119c8bf2b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf390c3828a3a9d58178d404f5b07a0221eedf670c7aa6c93124a1207314339c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..397016f351f6272fea42f9cbf5e4aa3e8f4f3e11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42402274744b09734264ac6295768dc5cff80a2ff2dee46fe3c4c61360f36c32 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa5fe06848d1e0b9189bb6f4d1b58fc9ff77118c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bac9d3999afc8513d53512eaa7eca07fb28a086464fcb74bbe0fc4864f26cf4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6bfa2eaf63f5bdef88f73bd4d34e746d802d45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fafe0e566b0b84d30ed4b779263def8f89e97f30b14eba076f39f56a07753d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fda27e933900d8053caf811b693954e4bbe78392 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13178bf445adbf42bfc17456665a7451c13ee86f4c640a0688168fe4ed36b6ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8c5b2bb1606d2685ff0b5851e375af5d20f8f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b884160440a8a726d5944e2e661ed6c08f6571bd1ac1386e8fdbe8e673276694 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49ed2970c0bef127cac8b38355699f15a92af18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acfef66fa1cedef9865febed90412791767835e9d72767111f2c0b868269e1c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..412b0b01b0359dcf28d27ef5c75e3169723140c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8065b1b7b8dc7c27ed49b600fa2ad2dcbf35aaffa128688d546ebd4a1c3b8ad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db58265650dafb2c2f6928456e21cc78278dda90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1bf411ef16a5aae42cb979a1b54ba93fcc043cda7e66f39d95b368248312fc7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..967ab9ee58089881d137b9259ae58f6310c176be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dfd3860ebe9782912a4ec7f7ec2468f055c0bd3700276407025e966015a1720 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eea549d676ae8780c756033137cdb8f94a36af6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5bcdab231cd6b2d7b5a0786a82f79f3c4bcd0ea61bb8a23681eb15e2ca7f43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df33a9f60043c0a6bc9cb86de81e86ab7a0de196 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b654486ded1f65fcc135f68f11fd4d80424d2c05c8f6e46391e26ce7cc922ee9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa73e9784a2415d09b3a36efc1086d7953b15590 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05786c1becd47b83a92162bb00b04bff8c925a8efaec791f007d6500b552f8a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc096e60b8aeae11e409c7c488a6eb4781249ef5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d22a1b0f4f2868f195676c6c429840f4557e2d66dd82ca8c127925252bdebf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..021de6ebcf040b234694f1a54a65fadec4d35163 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5a4a3abf043706ff2452280e660182e755e45c3d69e83167bc4daafe934342 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d93aaec7d35e445d864b66a21a98a50f8b960731 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d84c0072cecc34ddc67c147baa9c249a6367b12346840ffe509d2dc5b6a37a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b1732969645574c53d961745055ced598144dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31635eeff0ea9f9dbf0110f0964477f8563a3eb4f0985a8ae032b3a1474abf1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdfcd499ee2edc04ef94fdcba24b2047c31df2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced6735d6ebac3950b9c2b815a047fcb5a92584a2558732be9c7feb3ff339aca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73629dc8bc307dcff17c876ce5ff16f3499f56b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18a877f32ccabb198e33c32982f8a0ea44122c7111b34a5302b254fbf3c7488 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ebeb6c5401f6bd9fcc76cd1779282cf9fb5b35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01005b96f94535e941a7e57d4de3ad177aa015d66da19203eb8ffc1185cb62ca +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..031faf82645a90cd25016c42a21b7646406c144c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccfed339991e8799d83cd7c77697887608f8a9760587962bea017654093c4ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b681a217f3c0ef546855b6df59fe207d249972 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d893f3b4469bce1a78c1fd37d7403b9f06eb9acfadfda3503113ee6509395d60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3003e3fd231b8cc4a7fceacccb8918244c9741c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e6b3d8cc3755b4766e27b936856d6426b187e0c97e05b11d3a8afd6d911889 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db3c9d3391b11c0952e972cb1614f5c35f575ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143bdc24fc9fbce7583819f71e029e7b3b24f8695d916f047d79a2d334f69823 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76e42845fac2c851749dd73c183182ab0c142f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64fe2989df00418d09a07cc23610f2c262dabb30822225b43e604d8f119a16bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6cf4f23f66ae64f8c72a499609ce5b8adf75d42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b8b9e62dbf256ce3cf5fe6c04f2715d4bef8ce3466a5bc5dc6eb3c31683ad0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16a4903581ff0ce33abb46eef3debe2a402f3990 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5c03eb17c17a5bc72c25c456f97cfdd35c70d5dca60153f0478fb76fba5879 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bffe98e7220104d8914bba4cf7f06ec74e3476e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90437ae4fd7f100b57c00fcde42e9e10c2b5221114473681856dcbfa913f04cb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea1fd6e03b25698bc2348e64bc220b131d81126a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7fa3ecf53aba0f31ad3df761157694c7da849038441428cb1b21054046af69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cd2ea26fb0f3eb87a78f198af06d4369fc7952 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a3f8c27f1282d724d2825f67db90485bcdbc28372de1b77e12276e190544160 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6aad8055fee89fd425cec44b3ab39fba68b54bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0081debad3dfee78a79787ded129e6aff30b4d479132c84b499f4eec992e792 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd14fb57519e293cefd791d4a7981779a5c0e4a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18065a67ac637cf563c395d65b63eedbcb74a80ea223ac56626bd1cc2193f5c2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96e63f5bb221d262c89f4f56e0e7e5dd5d7f420 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822b2f95be332f179c528450260ab33b52bc289978aba0deb85c1733899d8492 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8433b3de110b6ec4ed517e78b78df306b0663b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8bbd8523a41d04ca1db057abe5c3c79868ebadccb2eac9778879a6be7302623 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..426bc5cc529baeaf271e9b5db6eb070e585b9a3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b25d6236fcc0f1702a993297dbbfcbeb34f6ff4de88615637452b6b186160e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa2d0fe5d7f76ff175476dec57b3e17bb2bda19f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1fb620392e9b7a14d7187b293a4e5074879f92664f1ed9e67271ec4175e8fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66369804a5ef2e99c1cd3a8c2491301ca4bc3be9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6517c5c0070d25781a735ff220be48a7c18527ed16ea8161af9a8ba6d7700c09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05471e1bd45fd88a28dde4324d81e6f2d5ae4120 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2789f48a136b97f708650a712ed137a9a17d3af5c47da694d37ca96992a2b8f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6ea2161e42fdbb4330e402cf7d114a4c827e17b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358b1f6e65adbda35f2b6d8107e172015f3eff234d4a5f886e860a8ccdf1f868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..058f1fc5fd5a8e8e77db807bb7724693c336cf97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04771cf3f4324149716cc5addb969df0b58d3970c13045e7d9f249439a70013 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..250197706f74d00f501652c31f763d6576f38748 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e202df9077ac6677d6ec793897b9eccae954a72ce341d99113ffcabb36e26f6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..089ada72a1d7f1329e257ba725ac6ba6c82aea68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257d8dfcd727c478ffe2a1b43bd4dccdcf6e14436fee782d173c797d73b3c0b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d4a9fb3e32e98c2de830e1f902dbceb940b38d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df260c77ee9c7764146b88b92fff2eb0039607be35dee1ddf6f9b36e687310ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7207b61c221c39e7b81ceeda11f032890ca1247 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529a2737a6c164f8d94eac9923bffa0c8f0808b30b4b2a16f3c3d60b8276c522 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d9c55a2fee35f4cdc1e16d812844ece173e2074 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8880656f9ccfabb234cd530ab05801264f6124a2dbaacd188b6f51343d37322 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b1f0d2d7d6c922599bb08e43fcdb722e4a5a7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d576f13d74c099d446599007a0e999b3ad986c5a2202cbb830e0914332f4814 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69265de24be9ad587f51adc895b73da6705afef2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126580279537d59c2b936e09a6bf809ba2c4528c12ddb9e7dfcb55bdaeb6c12a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ca725468d554c65a87c8fabb2a7346ebaeff13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8df95fb9257966b4b79387e51d2a50d806129ce139ddd235bb1d576a4dbfb43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b1dbe95c99df0ab06d777264eb83eb1d64d722 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f4042d71044aade24e0d7691a7b6819d5e1d1dd5faf6bcb8479c312d1af909 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..754ae3eae7c4d26e986a23e88970ab2395db0818 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04a0435b8bf74bbf76f224c477478c1e64624160e4aa7b2668eb84724cf4669 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2ee78af14fd3c6948d164bf92e24cbc96893a24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02cc8eea898f52169a16b54a727f9950cbb22f49e70dc435a8092af01a45c5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d8c750e9d8df55b4b07117f13ef5ded08532ddd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d5178e674fe6c11dc303718b920464c114c4092c2a1172cf8adef5e88fd9734 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d45c69f105447e121b14c98c8294b61848f10a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4b8855d543d2e75cdd1159d39d8ce997b1f2d272e6d4790cd67c094ff22db2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee52126998465dd58d61752cb57240a4b6c19df9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a98ba4604f3f5e22ccfedd0134bca3da1052264374cdd2562fe9ff6a0e51058 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ded3d21e8fb4515b30de7571684763f822beb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fc37522ac5fae3ae7a6fecea7d6f13426c1c2758613901560f5db22fdcb101 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ea9be93f9f92d339c1fae04538c764ba3406570 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d846b3cb05eff2b429ef2136d3dd54f1645233739b36f8505df09683668c40b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..788c97fb6c27ca1a40d0ddc1499b1c5ee6e8ffe9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b345f44d4b08604e7928442bcd5f6333d8fe76b8b612e4b77f11f790489ef756 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..668ee775e0acb5d8e27a6585cbdc4b2f8fe50faa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825892a464085e8894d0b060dac1dd2d8a334fef004dc3f8cc26ec5e6b029fde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e85ef9bb9a8f685e2fbb11ef05eb32ae76cb11e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf8a483ba8ac6e2297ae5046f9127e5b21a5f889d34f3e44abd72feb29f75a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d733a2e7b10abbd6b99a67d74160214877c3b122 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cabeadf0176a3a2ecf6c203fd17176a19b2a15867be252a9ba1e8fbfa01f125 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5155ac6237e2639a15d268a5e89566a8626642bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba642292141e271c282a9b9f796e5b33ef866269869623131e820dd6edc2f76a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8060ee2e07b3856972f02861a0a7441d8d267299 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b61546a84485fe2085b2e351b3328f2bc48d01ecbf18962dccd0da7fbfce8e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ad225524506712ff6e6584e1c8c1b5533957d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3fccad5a13570568e9d58d8caff0bfd08bcd9737cb04f954371cac7e0394b90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a4f56b3e9af54acae1e95223c8036cc357bc4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a251a951de4a21e335316962115a62f2551f29ddae0cf316c4dd5228a6337cc4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..497502ac6e038316df914e7291fea35a6d867418 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97777493a17485f8eb9286e31aacd6ba8b8d0835103c4988fa9e4556e907c877 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb95469b06dd25c75ed7a9a38054cf7dd912a52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7431b163d1c42734eea20421e081e6507d400a0703949b5bb548208bdcbab560 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d98912a59ae3f81f50d53bc49f95fb4a466734c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e552bcec5d06f34bdabb61ad645baf288bbdaccb33a08bde23bb7732992d205f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdd3f8db98b101314594776709d14a2e6cc473c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0de8e22c387b28e2dfbb93efbac27f474a68f46b4ba8d4703b89c78ae97a62 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4be0052c20b60421007d3d238810e0472130e959 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c3ef0ffa2226de4ad27eeabfe9222b762ecc4f0c053ab8d6c9f5fbf2fa744c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04120b4fba962f2ed7aca8f17211f7de1f21f4fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb7dce08d96dc49d9204b5cc53b76e823c49a19310212c29f5f6649208358ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b3ea6718290fb08ac5c679013bcd57adb509aab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c37a2485540e2d5ded045511ee571f360845383e0870f589adcbc5ef511dfb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f380e723cf3bfeba94acf9c66973cdf8a946e987 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c47a2375da12a7514187f9f94edab5becc3cade9d2e14f6c0a309d314e58a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cb89665ba8b011e1ffe659d675839775524a76e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf751e3994fc5ccc6b19e70a89277fa8141ddc8b73896f77ca70e165231ed2f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..256bc8a6e99f0e731ff499de58f3b1096343d010 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed5e9114274d247b2609a2dee68d39d47fa6f236b79ec51d0a6b561ae894667 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e5957fcbc42db0104a88b7afcae46d3c5d7894e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19fa4f9ffa02594b163baeac3228a41b699e61e8e8442603e490e8122fcbacc7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54cde7e6c52c313b3f2c50766fb7632dbddb3e6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3b28a0d792ab1bf50ef87816e11c845cdd03d7b69fd5004a96408f14aafbb7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec78c8d68695984a07b97612bfe60a3dc1a1f3df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8b11bc3d250df0cd863cb03c23525c938a4d6408554eebdcd0dfe05a96c1eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93b4f6d1b61c73034c0da51481b397a31828a01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b615c9a26829b4fcedcde86c62422b610c131bce8528d1825fb754dc8146b01f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..696d1118f02efaf90d54b1c43f570394b6f4f8de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c822c4f2d26eb17bcadf5827cd95006f8479d06af1f1f29c4b4aa620c88b964c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98614294ab4ec42e3cbc2ff710778ebb349f80a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0a09300df2ac35be1f36d4b0f077c088d3742ccca7a6dab1c91291455a2d0b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ae74e96d07220901e84af0841c338b67910c68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0820ec6e63f4b5e14b65473b798f4f72daa4c7da880f039a2afaa534e3a7793d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d38efe5c088d203240dad34115b72a7add0866d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9000030b741df83ad80ecf8683be5cc8d82b6b6fc3cf7351288e0e7dd2f7bf8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef8283584ecd4bc2c7e6a62f3adf117e3da5b6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855a12fb939d0598a7c7225116b9064b70edd0697a937fdab470cd98b141a2bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91af1aa8428c812d24215acc7d99b38c38096de5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1035582aec183eb7618ae568234627897ab46cd2f983fadcb52177557b5884fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eb1c6d58489964f64ba039b71dd5be94521306d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11dad85970b9b5353fcafadc09b83ca49519cec66901868536e7a4f5a3d38643 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c578edef7b92776171d018bbebdee0d521e0a510 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1f49939801e28a883faa8e82e3a646f8999d0d701b4dcc3bf0cf4162ec5d31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f7fdb89c3972a63cf3fb4af69ee6719ca1d6d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7c7d0b112854c7c23a5f55cae1a57c1c8517368450f0ce903a859794ca7002 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0503a1651c17f411e2a6579a1c4c69cdcd58ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7ef0a4eecae52a9c1ccb3c15ebc6ff621d09a80f47d67083b6c1d679a2465a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90e21b9cb6ca36ec9218527d11b978bcb47f90b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb015090a83c1edb45c681f26f39092ff4920f52864d63496f04493833b0baa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8f679a62d2fe233c5fc81156b41182cd1a47f55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e84e1296ff3722915e82b076e78fa9c57e2b76c36704a445a14f2d014e23c85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77eccc3fa54de993263f9ba1bc216211e8375783 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c90ab21acb76201f6739d931d0978e61756969791a1b692eef383bc6c0a190ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0271281a895b15e0b59b1d1edb4edcd6fbade6dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed4f4952042bca260d1eca5768667a0a7e56eb15d266699f5758b898aa78033 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96f639573770028ceecad0ea779e600e4365623c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d64b71f716584d702c9ca636819464b0af9cc2debf993770526f19e4044eb7a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eae6cc336c7425bdc958547112e799ce947f81e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e9d4b88c348f22548e9c09833d2ce28526b37debb9b9e56b0000990b934417 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2ef22e869d6a918550fe658a3fd46601daa1a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3ff323def103b738d8cc06dfd863e763bc015cbf8f197f170e34da8e321b6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ffb811ecdb59c12a9a419d17b2a0128abaac04a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb51207c658954cd164ae33bd084ca4413c3a3320fe243ea2d7c6a2087a3ffb3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11b6d4390d36c84773cf755b1ea094b0fe4aee44 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d32d291945fd71aa25dd9e3ea7377784b97412827fbf9cb97ee2961ae2620e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e1462b968f1e94a7fa1459f47e74f4a9456b8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9970c6d49595b0293ebefeaf56b3e7bd9a7e53aa2ba07e0b9098019f40f5174 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bcd1f33ec6e96847d6e46950be13e7b3087903a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236a2035f78d583a6f67c2607703434b494e399ab11459f62d2f4917eebe7805 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8f4f38d574e3aedcbb6f2312baaa967397a7844 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca705d46e48f0a5a580951b25dd27e73a99ef5ef7785a2b94d8ad16d31735f4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9379ad6fff00d6d8e35cc0a719f0f7d16e842c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e8eaab3d1e6e7e55cbaf7dccc5a632cd901520d3e084a8bd7948b3d65dc31f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3c67f73566aa862fb293c68087d822b627aba43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673ca428e61ed671b929cb71b0db1587825e17c160b3247f6ad3d0913533d5f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..711f9821a3439815ebec9efeb947c2a7eeed2f03 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccebf2fa8825ae0390bf0f6dcf46e7d1aab4bea54ad7720da2de6ba6df72cdcd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d61239f8fab955815e21f4adeb45fa561431007 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc172f27105464a42abdde78e075d02973c841db2e6b1f146eae95e52e245e68 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0533a9ca56948f8ce5516493547f8ce992535de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a009fb324ffa2d6356bbd9e8b786b3c3e7e135bf6d3c46578d25c239466cfc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b8380d26642a1417505701b243577362fbb654e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7311062be3eae481a39d09909afa877df8056cf52c67dd8a75afac9c1c76daa8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e169ccf2bb453cf25dc4ac0f374e9377be433bbe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120f4b156f11a1f5e91e8d2f45ece2f709c98629223e5daddcf03a630df2a81c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d1b9139d82633e6dbd7878a0164c29e87eb5500 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1b1bd5b679d572bbef410d0986795f1b00543872042b8b5bb0c0307d793006 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..357bad37a67e4a3dcca324df857e98dd9945300c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7195820674436e098eb7c87bb5bcf4c2d0833d95b62cb88b4dfa1765106e8e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74b309ae7cd9520e74133fe1124ac41aba1825da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdad897b6208fa5aee8065d66dc32057ff5a69d04e3dff39a06e91db1a2ec53c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de7d08832f806d987a6551f0d7278047d41b310 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3ba35b206b085bd757a665c0f907f0d71e1b0919126a9ba365f82ca4c50460 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8900f7c0675d050509990afbc07d05568fc8bae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1173a52ae8d59159d5c8029eaacbb9f06549ebe5c2b09de121d24c929ead7b45 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a393343a0ac2bd1e7dcc2d4ce5e453af022282 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb73a5e7cd0ee1a04fe580dfd906a280de83931e220f12a6d6273d94c3b66bbd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c853781fb0605afb7dcb650cefa56d479eb45b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdd273ae8665c260f0e2cb46e89e4725f535baaa5e107a2c6dc3e7d6806c24c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f73a4770e4da8996b35a39c633cac581132cadf9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f1e4815a88b670d97794f09ae20d001623eeaf1c4e97d8f787575c001c1d44 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94868701c4974072c3d6fb68da6f308625683f0d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83559d04db69cba8164e6977a8971831941cf26858c95941a82e9fd7fabd857c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca9fcd0e3600de9a3d943c75c7cb3fb6648ea7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0159a3648099f693bfdfb410a34e966a489d63e415da5d4f9ce69fd62ef5213 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f492acf1d93a70fc825ab75f9009aaad7a62638 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3887c4479719af3595f25b9a855b0bfe750d352336ed328ccae4beb32d78dcb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ee84972ff336838eda07b2f7706a5916b94722 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2034de14919c456ce207e21f44ebfeaec8d6c36f920e4355c086d506597c2a80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4fe3252fbd8e6b6be434af2d535e8efd69cef1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d9f160e70cf0da6cc8715a80ad71d9be647cafe61ea906bf3a96e827223521 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee6756cd88ade851c5e2b55ed4bd49e94009c28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc9d0d3e4e537d548f5a2c6d3ef4de2ac6cbbb14fe495ec74e12fb09f5844f5b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1f1f1214512ba87a0b7598d7a2e1b4b30c2640 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848a8469b0eab3b6558152c7128fbc8062c2e6518e60c74faa4e3e7454886a53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a3af9c208e49e53bbe08f921a5ae56c49a8bb4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07aa955fe6d5587a017de28af76140859f6340222bdbf653e293b3c998f3ff0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc80f4f022d976a40c4275138d5020d7df86b71 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38513fbb51ae0873876080575573142fc810de18f32b3b4e808551e2f65161fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eaca3ba566990ac1edc465ac09e5e6fd7033a61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176a761a39a5a0198ebb22e78a89e6afe76d9fc37d545d2cec4a8ae0f71eb154 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8765c9544d7d0226ec87d268218fee7e0c4785d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04665797262e37d7a3d46add777828936c4a17a6cf30f267b05b536a867157e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..235ff280c497983d0ee75674e6ed11e157ec0d19 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9d42bd73c3f3eca6472faa3c93f2b84a65969b28b20f926c0d1d16da01996b +size 11395