diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aea61322c645766d207d2b9a5524e7fc6f6adf69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5263213fe60f2b7111545e7b462675298fe4ac804749a647a67c99b0b3689a27 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47a09fd313383d6a805c62ccc06f890746d4da6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b4cc89548335c0e1e3bac157297a139dc72d207b4ff46aa038f809e1f685be +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc97c21b5bdd8ae79e454a4e0310394effe93de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2b44ebd7cb68a1067173f09c28c8974cf8b8c76b1db4544a2d340f449bb23c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5698123cf9e123db749ce25e6fa59b7f62745af5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feca25623f006976adc4ede1c6a01a4734aaf3ce8be182f24e7305fcd80b5580 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8acabd613296f4c5a511b2e331afdfd62f809de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d655f23808cff417e9a579d0d253588a4b592bb89806fc0c2fb63ef3f8d24bb6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69112f6e245696475d31cdb3a4a2d9f8d9174664 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d0c02cc3e9d0647bb5283c2add2ab23f77851a547bf5f3e91d1e95a15062f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35b3aaeb01bc0a4ee37d81e0b1f44f1d5f01110f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3248ef19e3d857d6ffaa002a15f8af0edda3f6f2bfb4fa801e2e6d2107baca3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..deae1fe5d238d89c01b8e9dd507ab6ec7b181786 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42151786b29b900b0269f607b3dd4977c91cf4af415c34818733edc2cba42753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..355fd66a6964ebb1e6b297417d48f3fa8d948310 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de810299dabd37d80f892fb5d455200f35316ce859af7e9d491381452f526e76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05febdc9e26027e1a2d6a757c31a7a6f0b050edc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4dabb077e7e0e866077ba4a9eff2ed03fe7c8f24bf6d117c85873d405659e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..833eb1fd7cf78426d37d7c9a5627c699ff812314 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c43bdeb4e8db06886002dbc0202a063868683bda1f80b4ee30062a992db91f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..124f727cf606a1114b1676379d6fa8e155f7f3ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2924137fb41c686b8f299950ceb1911b711266d62c65c44cc41cc279fa7819f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d37963bda73416a58957e18ce9e4908e7eb648 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4aaddb28c6b44b591bc773b89181af74ebcf4f0cf8e48402d0c791665688ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..680f7b961b29bf32570a8ad287fecd3411252dc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316cb2d8889fca9ca4257efedb2708054e3a4a5b45055c758c6f91522a5da2c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75b55fcbfa47a710a69cc4771c5aac522e1b8ad9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef6f389a84f5aa271bb1636255aced695a7118597718e2ea3d1d71aab67a186 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f883b5ed5b37c5320994157d2e983f300cccaa45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538e25441c7e7e3961c6e1ff33a66fa017121bcfa2ed481c3b04fff26e4a2388 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4daacfa6bb8b5e3075868206b76f2854c34f7b45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f170176c55b4c962a63c94aad600e1511d2767550ad8511bf2f48b6fb082422b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e9926d4e776b2154eb47183600f0368e828064 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205d4e35f141b80406ed5520a6e92c39a38a7707e8c29e9b64c86fa6348774a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3efdbbf5e17d80e4e101e94672baa18e37c31a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0291fff1dcabdef5772ba4b463c0e58c9a7c18f22680ba85a9f1c12332467f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9295ded26ec58c86fb07562eecc10cd914b02177 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d368d29e16b7bc4e2040f2ceb253549525dbf9f7e01330dd58e72bf6bcc37d29 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..310c0ac4044eec54331955de9c3baa6ae34bd473 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff77567e0f3122c8719e579ab96706d4c393eda0c3802541a690d208f5270a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c423075a08a493b561c5b4ad362d689858516eac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f3b77b5c266cecac619f24c08a33f456911b461ca3b6283c83d1dea974a67b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..054ec5aa017e1d7a76149d5013415f03e5c986dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a16487324410e492a407c7a8ff9d547611c9ce83417c8908132e26b20bf614d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61f0befc65057a5792e472cffc39c9d74b9fba5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c65a46965287154586ae654125405d807efc9e631916b214894ae01c1078c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7351bc03374bd0fd6d259773944e8b575153b28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3584806526e98927bc982007c43041fba0c31f435323d407946f1b03bdcb90da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5359750159a857a649b7faba6aba2bd4605192de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0b19679bf855de340464437937edb93324a74f07a890057f5ec4d20131e6d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b0a797c39a0385688089f7224e20a326c4068d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c735911330f1b63cfabc4b5aaa286395dd00d3e30a05b0d2f43dc37df7cadc7a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dde4619aa21778c9173e7ccbd6072c3b46f6393d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6acd3f7c86a5db89f83b0f89c900630b17f796afafaf77f1f1d474cc626e29 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..462c82bab53335f0dcfb40e3ff7b709a77eacdfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1d6c92256421eeceee3061bc9e60ede386ebeefa7153005525f0f708cdc5f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e44b12fce1ec3488028227f26b7075c518d2868 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f09c66c2190e691fdff68500a4a19142b96e78dab9f29574e683cb13d09067 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc73eba95b7046bd0d4477b3e6944672d379eda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479bb67428dc5215865bd6c858aca099fc26ade78beb74338bd23ef169cd5c27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..853c9830cf4e2e97125e3fd2d534c4ec7f5dc972 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0369a7ded73f5b17d0c82c6ee049d145d94c5921b5ca2dbf329b37667e496efc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf7f7cc3b8a02f6e41360316ed4d6676b4ce5c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685e63a9662e24dcd02b276312d56e857cfb2293ffa7870d1b778224290f2544 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f1bfda042aabf6b4aefb50c8b0502622fc5b57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ee92051ab2480ccd1eed74a8b431fe407a87ff60f4c86ace641e19e17b51ec3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34dd4312203e1dfd95b0ae648ee3c6668e1f7a10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe707683c540b2d7425be27095389c23119223429c9c1f361a8eb95ca1f4ff1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88b9bb5a75eb62df5de71869b1ccbb868b14132 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf1aafa23526af7a511931399d3e3af8789a1d9781708a67762e9ba2ce7d36d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a850b2286af86dbf9b76b2961caddde90e1bfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d88f59f0d66d21e2fd9cbbdcd5823c72ad585147aa4e7d0fa25541829a40c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ace8a06002d004d015d34b9d9c35bbb8ccaf224 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9f67daf19f1d34f27ff2458911cc5e7cbb6eb5900c7cbd8dfff3591b96e3f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..daf6f6aab2c985802afd58d76b7a39fbddebc6e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1acd5d9adb3eefa2d6842de0f745b4ae7e02181ae8b847160f38f21586bb9bbd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7650388b00651e777267cf5012af993280e2e44 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd1179aa7222485621e3f486183c28f3a3e0abb09c330be5bf6b05cae847b68 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8166e9e2a6111c5dbe0d4eea8fcd182017d5072 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2234c60211ca5e68292fc53b8baed184ce5c4a2d31da28f7e3c7d6169392e6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3d140557b4d5bb6e97d53e3796ca0aa71cab76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c30a9a747f734d5ef580d2415ca8c743a2622fc431fec1724591db37c6220f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1169953e871aaa773f0277f20c74a9b9da7b46b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fa0943ecf025405aeb369f6c86b61789082994ad5360dbfc74de44b1882e68 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0934ef42c9b38c2fa74b09317764e975f84b661d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922dd62ecc9554a91aab19b590757a33c9ce0d696e6b86a9791f2af1406f723b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9576e8a63a4eb7fed8f1505bac3e21c77cff97d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef225f73f0bd400622e6fc698c9053d83a196e170596cb712a1dab2d1a4649a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2d8dccfa761b5cc936ddd38ebf13cecc9fb336 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f5b9b0994fe353fed807e361f00c5f7b504c817cca7a0565ab9d16a988505e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..926a177ac5cf93b045941510c837677dc9739511 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a16b864875cacff7f91e17d323e82dd136084926b8f068e12bf61ead1b71e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d6c3811c32c1ba0684996dd59758e5d3b6b4c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd30cd8108939aaec8a33bd693891c109d681feda307f00b5eef809e4f42687 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44144e9ac5aa8e60a0f303b803ecec3042d5ae1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d106799005f7577d87a0bb8a75acd09d12efa5c511e6c65ae6f8872d81193e14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e866ae79fd41fbb52e3c3636db90b11414b9c26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12b1fa29749f798dba25b831cd4dc23854eca490a013ba6ccd2c2853b27c49a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6ff4d47fa42235c23d7d7a56a707be8b95c23b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b6ca2936e51fbe23854aaccf0c55792cf6e610f03a746f1526d4a818f20222 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af8cea8f250768f9d686d66661a5568180f82ec8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6004d27ec4ce833d3bd572d779ce6dd1e612b003d36e893b5f9578e18d922d5a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45d4aaae9cf50c6a08d1ccba51465c9697b0ae8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab01724ca306d29ea63735b258485779d5affbb48ac5714a490a183e80645b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9edf66b7a3469e4961410c142631f35e132818a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0270281f49ada26f204563ca3b2486cb439705a3f2ad5d5961a9bda21cb1299 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7d95c5786bb2756a24e7aafd9427c3fe410cf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3990233852b718a879e19be3b3601c3141b82642106abaf4d5cdbcfb3de03f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a585468a10b30850d39244cde426474c0b647a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9aa1c7d1c761b5208a8ec4c752ac4ed45d3cc96ce55ced7231d882df96c4b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ffef5d476a27c48c4ff640754d40e209bed63da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e74fe3f9374c560e7793637665a1f622513f061c0e515d01a51ddec0a2be1aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b16f6f302d6688a5e214e1e8acb7649c60a814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8d2747c7283931b9f236c6ee7925d7d8a14042cc9d9fc5b4e3bebea6132c0e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f9575f8c9c9c44353131125d15957376c16df95 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d82826205146a36434b573805f2d54485286ba536fd6ad4ff82f819c226656 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..347e0c07cded919024e38f82bfb331d82f43b494 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f4553764aaeac7eb535b5dbfb67fee599cd647debdea6bb354300a389518d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..985fa15459fcbb9f896cddc7725dfcba8cc51fdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc889fdd457149d0184db37da192f87e7315787c2e6994066bee64b43fe37161 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27df7e42515a92db4716ab4f4ece071199ae9600 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d9cd664607adb8e43aae7699f8b8dcc59e0bc3cd628987564109ced054522b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a241fd17413b4f3b817fae8db4b4c4a0fa4a8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fc12a0db1a570bfb6adf0d0f446aeae960cc53093a2fd5e270a0cb3fcc511e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed6b837656f3f1440dd1ee0c76ee6593b6113290 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798f9e0ea51865453264a908caecf19a287033299dbc0822a343190c503623f5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84fc76d4e9b8eeff5a851c57178254108a656eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7c28610088311cef3031163f22c3dd6684e187cc953b8b8b169dd408d853e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..070674abf724f1d0644ab98b355732d34206f0bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5265867abfb071c7e745094f84603c5a451150128c4d36b8dbdfeaef3ef10f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0befd0b1add2f63a40fe7d933aa1eb70a011a814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b08190099769cc06cf7cb4ef5c564e0f890fc21abf3c12228b3924ee7f561a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac91128f2bbf53716492e5de9c7fed5cb869445 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b4f6db2db9e6c53392be5679d145a12c08e5f100dec35f31e21ad064e0cf2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dafc8d2077ca0815b2ee2197b96605e734daddc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab736828d72d4c23f28b2ae3ff3a21ee90c8a5cb0d0184433bfe6e16cedf7a00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1582f5a3cf75eda34fffa4a1ac40214ef11b87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1808f4d0561faa600a1ea5cc4d4fe94d3f731eaf289b3ceecc7daf88a04ecf34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03ac2dd985afd1dd7041cea2306d7ec63d204723 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175cf8f1a92024ff9176112cc37ec5f5978acda1778cdc33df01f1e738179e5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c5f94ee3de85c3a7b67865bc58086a5757b2571 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f77e425d0449f50575ed57d4871fc271847f02a5e4edda8f9798933e5213b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e91e3a2f65652151252558f266a13f039117ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e2a91d6df7695c2841d0b950a079522ae1df1b637a7fedd1d44391e69dd08f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9dba0da146bf2212c1f48448a98015a6cbb18c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3bb854209d573ad03ed03685e322753e0954554a8ab6732508423cad9a1e8bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dfa08f48980cfa34e6f66bedfc09763c1e090e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f811d381ae4abfacb5cdc65ad19724617b254de69c574e6c34a0f8994bb100b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9038ec55dff2497e73982b3fdc523ed6419dff78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1f73fdb500902e230772e9e676bbce3783c84fc704ee97261f139ac9afa413 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c8dcbb9e673d3632924dccf651c96cbc21697b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ce2243c34a62b9707df8f7da225d05a240fd2d2b908db254dcf0f7809dd1dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7600cad10e6b2c451aad12fb252c68f624819a94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5b2ceb8e1d191ad5293eec81d124ab023f064641de05210ccbece5ab4a87f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e20e6b5750d35a171a1e7ee05102606b819750 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cde46bb306f2887c38bf4fe4e79fec7d21bba855690e52325d2e344bab4fc16 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cb9be7dcb688cd24ee47e58f3128e1e69806221 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cceb53f4feef04d2892cf6ae115ed75ed5c6eda3da44751cf67db41b24af69ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce23e0a077540517de5ad956d25a718da4e7fb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecca20fdc357f89d3de9089dba889f976b40742a51063fd15e7dddd369a15562 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca29669c82d6e0e57b78fa8bc6b4208d8f77805 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a855fd16bb16ab80944f15ab0c0663a39d38111feb8a87cdc29886b7525e073 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95a9e92664b0a2ac6de7f18a4eb9633229475f51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01f5b48569eaf37aa7299c872736df037061c37e11d12e8d44b1597edfb9c66 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab92620931692edd7057ecc3fb48892b75576fb0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7761ba0a956ab4b5930b0f35adeb4478fdf0adf5c86bb81ed2b9e28a223927e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..871d295521969b520dfbe0d978230a374ec3a8f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6f9f9129cc4f938ae970457e0565e51fee6d0a5e649a0753d1312362ebf03e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cc440efcddd36e05c31824e31a961222d10581d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fec0380bf7b7cf97d979d7e154d7cb42184be0b18d5cabf6015918303852fa5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2a6e72edbb4a0aa927b9cd5854af7bb6d89fbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088922beb4a62abb0c8f438fdf1f238a4bf94e2c3c13265b83e85217798f3deb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a82a517748df84bae36b433018984df27537b8c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4083aa9ddd8b0cddeacca8f09edfc8a0eb353c2ae1466326229b16b6b52c06b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c89a7040d91f15e8c6464852f0a7f8f2511f7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de20120ac1d452002202a8566308c8d8f5aaf529b11d4059a27c197ee1c7e70d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c0f5e3183a222b55098fd6ab5fd133835f0f555 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2bbbbb56e74aa8132012df2769a054e6833b20a2805eaf0159af8f488dd2f54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1feb45e642fc82d7a0c48959c455b8d146410548 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca46668e65d69c100e40fc2bca9ea4a271bc1a32bf8f8f190dd8e50c916a282 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05350e573c5682fcda0cdea6f9a668f2da20950f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dea89d6b475a129bcbc467861eb2fc3e39f5001485ee4880f829609b9700326 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c57731da948c3a917210edaf8103a55e5890c309 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef685600635966674ef3c5ba9c75a1d247be738b14e21019a74fcd9cdc476a9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f87c98a42543a68cb882540a46bc639f650641da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e18de03e3839b76f06ec0b691f7568c148d7195380c980a0470d9b1ba5e96ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01690191e354230fac6d09f9cdfc50cc451c6439 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28f659fbc9434462a5ef54d447e1cb2b9282ed329827e1f4113eeda77def413 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54659aa65f0616506d9fb1f7dbd0fcdf9776d7c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e422f951f488f5d1f0a24db5c329a4e094ba05288e59960b2fbe365f32eb2f15 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f69c4f7cd687bfdf98af21d778b5cdd2ca895b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb15ebe177fa80306c24ebcd3e949ae3d9714d465f4e57cb67b6eaf3136695d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc8a5d227b8bb7c4a39b095e725e62d0434ea85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433737898bc497aa19e8830ae9398e470e30b684df7d6dcaccaac2816f27acab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2f4bec34842359af225ffc08c5b0be56fa71be7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78b256a0933badd4088966290c004f34c1f789977be6728ad80c23034dd29a0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b61e6cce590f99f7e72574d3ff4a3caa32f5b45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e22c53eef215f6a53a9d9932081b7193779c9ee0a0298e60e4c95fceb0736d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae573600278c6ddeba85e6e6ca699ee1cfe828a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c7242d0c6325b620498315a2cc7791ff1791df30f52aab341bdd63e95df5a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91d4bbdc1e58d143feba3e53f8784af3eb44cd0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14accc994fa21c953ca0c96889b9ee2df7b5e82e6a6d21e421c6132c68a06f4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28638b030b463ed3bb4fd35d4b5c8efa5b02aae0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272876bbfdaa2d75361389d2766f777b15a3b3353c288751a4565e516c47d78e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66f007d426387d23663c8aec50cfa002662e05d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c900cbb62e64e08750f2f4a67ed290a106bcebbc9b0aa4754c3b4b620d71842 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27d9af684085ed23f90161b7d4e03ac2ddbb3a86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce78c33b5353aca20a2665d1f314ea69a412bd41f232acd72246287dd40bab6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fab825a5c4e994d07856d9db0e781a08a7afd65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca8508204d07445406bb0c6b401252da432a1907a9087924a01e56df4c8697b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6813227f41eaf918c9ac1cbbdf7e47a97f0c6618 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bbde9354e2b18770d5b1fe363a0b5981c8b03ba52c2bda6270fc5d0f517b9a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1db48635f123f1b5a9cb2ca70c07834ea5b278 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c82b6a66a7e61830418cb7178015ea5f8769621395911eae3f13daa8c052d0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ab9d47aba229ad4083f0ffb518d23dfba9d2f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7b1278ca04c37007041613a3fd1e7f4ab40ee0dcffc1fd7ade27d1361ea9c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0485e901218441b4a96cc9190ae6cc1a9e8d790c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02be60506533ba337bcf998d01ae57bc56a0586b97c64b78fec8859119f4ab96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba93c288348a0068d48d68e8ea6915d7a4d0678 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e8560184dd7333002043a81fd58e21b651d4a74118e1abf2278d04ddc03dd4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fcaad36c940008a88f6032cdfdf71ae4047e75b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7289fd99df6f71ffc0734dc4233f6bf591ad5c6bbc8f24299c2053684bf85c20 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f660e18cbb46aa28aa22939711ef414c33d1a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6bc8abb415ec78dffe000a0869906c63e5c9cacfaa8536eb58d1b9ac3273c8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df15c641d458b6272937d624b1fb9c32e739d02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f9d9ad08dc66d073ac36162f7c3923886f9423665d3c47c995207e9cb217a46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3746ce329a7f07a455326b3a8318cc9c03c0780a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5245dcacfde14a52860b441fb360644d8723224f7c582713a49d0cee36c5cf14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b474ccff59288ccad60c4c02facbc3c00b3d4049 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f2e20ab0bfede406b161078b5dc17c66a02584a81fdfffa655a3a368b19b29 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96aea624a93c3739e78afeb6bf8df5ad977cacd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130d2bf9a9df29dd35d9957a95fac845e636a8d656c708d422363d494e35540b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b85b9308a12fe69e2222f02fef553273a37bd23 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03bba0001d47337abff52d72ffae24a1fa095d44a462282e98df7982f5a69ded +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ebe12ad604d350eea32b89094822f58dbc58c0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852636ce55c963d6212760010f95ba089f4f5915c44c125825b632c0de31999b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d8799ec92debee203cfec7f99ced983babcad24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd00501cc67e594e89b34e0b38395845a9624725c0d7caeb47fa1385a0940fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e5f0bd13edda0febd08fbd410a186f767d56b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffb12a5f828c7b99533742d68182f5c10f456bdd55e014e38801d454ab3b252 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e1d90f8564f1a83d385192a6357c4a7a00b01a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa39bffecf4beb0cf8a8b99ad124cf3ce45a65eed669d17efae1f5dca1390753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..757472689e13994c6c85e83f820a7b778cf14b50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8517036dd02ee271fa2696b33288b7152a5891145e92f62d15e78b3c9cf13504 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30546cada2881639353948955c8e5c269d11068d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21644ae274839c2ebd4aba1d7dec9f1102e14af5355bd92d48e80422e5eb61c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9263703cbf5c4f4f44125aeda23e3011042ca5e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c6dd44d835c7e0df9315d976866ef27b4ed9face3d0779424e83e327977ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e96656c855c16fdb3a920d63d52b21e743186b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ded6fe2338a3f073fc7ee24305d14c9f642fd14d6e88306410c9f5f16d2330d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..286fae7129643a809cb1a8734206e7bd781f0235 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9008f17790a118277af1715f9ba29b549decb650c49c5cdf8d26460bd404da1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66100af17d0c4b801d2e9ea94762094c45e75cd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04bd3591346840dc03c87bea1db0d96e2830d775a707a05592657587bdcde116 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a99fa0dbda8b059f28eafe8d9d81d218c790c42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a416a20b6d1883256336bf837e33c1690be2f933aad62ab88e67787c7b581b57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66110bffdef03f3401e841f7c75c8f59d1fefe21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5448fe925b91dc30c0745584afb0952ee9eb7d6c2dccbeba0c3a5b52e82de576 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a0ed5a813dfc83c5644f660fdd016a209373150 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43eb6b4fa71acb2b421d745bf9714533f840d7e73646567935f3d7c725818195 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e008cc30c011ce3f1e3056ce26f38c4a0a0bb61d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01df9449f64415e082176455875cb5965a7cff9d177efb5646b0933e34ced661 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be2868e6f87cb33cc82d0b53640179a86dd0133d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d58451fcfaccded3beacc4df42f8bbda60b77a9a58db45464675bcb6fd66fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d321d6a061c4bc11a6f339d9e49198f449c6d0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2da892fd4694d3c06b62d45ed99f8e096afd07913f8c0f274927f2da41dc9705 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c755291e60e3330d71a3ee91a1bde3d49dd3a13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13533cc8eab2840b3221497e4a6262090e18546de0d84f47c1c89a6dbecdda0a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba5e52d0169b8bf3de938477a3bc3795f423a1a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f913c4f1813c1bc63db3d1bfc0bda6afffa0d3ed1963af213f1b03341eead2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e99b11abc40066012b70770314b15f7bd73cbc1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f1b83417f90a106bca4dab8647535aa35cf841429a62225587d70376a9b2d3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60d047b38689514111cf8e57d84d9f3f3f76d58c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebb06adb976c2264bebfe83192d4ca973ff470e99b62103ff4a7c907775f96f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b868daa12367280bc21b4636661170d7a54ef15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766c67ae5665b2622c43e327b9070713386b6fb9e6d350dea455eae45e5c4075 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3073ea10a75db7ee571fd2e05779c7f64d504ed0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292fc16bcf2cb4422e6045453f5624a40a3ce72d43f40392f4a4d6f5da1f43b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17400f8cce2b520e7c75b728d05317dbc1859cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a13fca86c0eb777077fef379611c21a4900f045b54ee98e819f2724cf810dfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1426790ac2a86b796801cae64561d1de655887b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971665324b4668b031d86cd0cff5c82846433a21c155fb902aa6bb5b2597b105 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f58648aa1f48439ff1f9161ffa6cd07cd0bdf63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb2cdbd6ed17971eeb036f7198ebf7ef8e540f6697306d8fd5c13f3945c8c14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3cd456ca52e3eaa997d50094ef680db85e6bae1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116402d50184002b82cd5ff86de43cf920f7b4136b0adf68276e1545421e5ee4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64ee803d9b937d314d222c1eb27bbc007c44fa2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90cb37584792ddb132634ec24464090595f559ce3d6e0b2b7ea87d30eb6c81e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4db698e9de60d9239f02b702cd65fd5d93ba7923 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2552676818308ef202fc8486a89c6271cb024415beda6227addbab3cf810cce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca29c0b951a76ab48a3a429efd01e0667933d21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8274884f48bb490b132bb0f2f6ecde382b1372fb8257dcf0a5beb967b319ac6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e41cd68364d5132be0ae1dcbd5b06bd3d6bcecd1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ea9733208633484302698c981070f5464d641513ac67b1b4204499f5ebe2ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d0ee14a3460cb003ad781f4d7b207af26e90ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fe286264229abbc9745aebc3d1579117467d38e8b6f514408307c3a639de59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38d681a601428666a420251d96385cfff08267d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0280d5acad94bb896beb4b74a149d0942f698ec07f4f58db5987e2e8d448d35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac8a5795ad7c5548b300577ed838cb7ea7d2a4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436c3c1d5e59d056c815b836bfdb1e7a5ae73a4ab2f7f26cc61d90727bd8ec31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ab0a0683669183c8876296933098218e9bc806 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10992dea65cfe6824fb055b82cf81f4ca68ad13b1aa6d5efa1561a5f883a8d10 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..599dd4970b51acd822da5b8a0a1945ba83ea72a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08cde14d609bb7506ee9512a0533254f43e7182361d9a0346a756db928117594 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1d3b3c367c65106c78a499f45cc093d191eee4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56533267edc2d247ee74ae92c284301a2e13606bec29457e0852eff9cfba9239 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18518f171b9f57039525e64daaeeafd37f444b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5109a44e77d15b47c17be8bd15e937594799392a19e304a6d8a381e0006a75bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..518b3826f04bb7102de153b49ae5315486d35a67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8551b88555f63041c042eb76453f3424a88066a79b5a9d82b15011215c00b91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33dfc5aa42638f24fa44631365f754b73bc36dac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a822a44a37cd2d62d4d8fbb0262e793145e7cfde592c81eff450cbbd6b9ff816 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6129ada1877a2e633fd06ee8a56e1a20de81fbb4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5d118c79664a72a2f3f820ef187b10ee989bdc261afb93451487d4932afdf05 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..262efea184c513717ae323a07016704db7a43077 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7820d5b4edcbda5eba43c413dac97736a2f0fd1abae64743ddb9b8d86e63938e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c641e5e6c6c79296dff7688d619dbad9d7de44a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca837f28eb1435773a06bb81c8fbd2e2cc88588036b38c57d8669c9fbdc54a4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5da9e37d08519a4731cd5eb6605126055dff4a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c066fe09fe2f95e94abd6799fec7e1a6420910fa235676c924125ef7b003fe58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0cd2762e36e9752c0e66c555ed863b6d6543b81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb2b19d9b2cb7b1f97bfe89e5ee67730b1cf9eb75166f3d7acd435d561abe4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe518bc5ed153c1aebc750e028bb54fbd7460a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820c311eef9c8f195f82e0afcb702aa6331467a0721b0ca6e532cc27b3982e0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3add7534fd32a1c7f6286d4ba2f920fd5d39a87b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33bfeda01d2b5867ae108700a00521311b71390862a5fd855e50eeb78e69d144 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7271c48132512e659c72e1aef5310443d09901e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5d2fefa6cccce986294a7833c023df7c2d6768f1c481b6c9b70d78fe6942e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f72e61a0701bb55a823fca63fa3f068ff19fafde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16b43090d374fd63907d76dd4038bb971171d72d0b3a9de2418d63bb1a2882f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..938d88db3c6179f099bd74235cec1433597aa68c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3975b916c4defed5cb8167437ab4505d369233ef6615416f1f5f020e62b19577 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2109d951eea6339274b113853e05ffa70fdb372 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c3efbf5ba8c9efea5dd085567aa65adfadb0d0f05f02e17220f8372955e97f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40139d22d9c2079a01a683824570d89a94f8c6c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9683b3e7adcf1a15ecf5e5c533587f79807421110fcdad1fb2139b1403bca363 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc7cc9c9f77a8cb726201ebbea28d63bd3b7637 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76618176aeaeb558ae1feefe894ee5473b486448abd12934a9cc49a6f29a8c7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c54a8eb16ef09222f7756a53e09ac02bab12780 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb317748e5df83ba493d8450e92b2e60ebb52bd6d32eba1dd1ec2568c7ac3b0f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68855e9c8e9a0c69471d6eb62583a03677614f5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73451982912fc8e0b480826585ac0f8a0e12c1064221e4f249f162928fc325e2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dabaf012144ee8f2b8965c63fc9ed02dd1520cfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff92592de249756100e55fd7996af88f6e973816b7d9dad44a1ef1281e1e03e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4464ed86f76d6e3d152658bfc4834af665d9ae7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1826ab8e3ce8fdbb6a29b80a6159b19ceaad242076e304e8c2718a48ebc0b6a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..194b1f7be8b6919f163b3635c9851499b3d2814b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ab7a3ea1ae12054afd29fb10219ea0be87f853f8a34bd99479b09dba71f8bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7e23b0bbc1333eef7c953d142ec3c44945c4d81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4da30bc3d2865c342346ec6b47f1d280b390c36c560163a68069643a451df88 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec30b718c8f5fd554f216f7afa64ad0853c31bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f81e132277624a62793d5a6f0287d6aa77aab13cd7b459a4e0178a675aba8b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..694b1dcbdd4948a1d4b64eeef4ed39f1a2ac26c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28c6e5ecf91ba2666be49052c764b95112620df0c97684fdcab5aff555d9bd8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53ff4fb089b73ba521a5342b86ad1f1bbbe76de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b3e0d1b3c27f186c563000d9adbdfa79029118b3effa36aa8c76aceb88a552 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99993a45bb0b265c4fd399b938ff87abcfdec207 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b83b6f6412da7b4cd8e8c9e8e8a899b55699cd4c3c366aef3e6f839285211a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08569dbe9ccf97679d90b568e901d73bf1fc0d0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8a106153b89db71e423743797b6f4c52c45d255f1177235f31fee55a31c7411 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69f8a021d9c1c20dc4581b766e86ffdd3d519365 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af04dba5bf91d00766612f994b74a31028a358246320f8e85a6f753df678fe75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..615181c2ab26f063e592e707e1588267311ff81a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc87e9778c8c72b0dc4d9199c82050056310b0fd1768f70fb1a9ede20e43b16 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f1399ca81867ce1150151c8e92d39eb2b019a7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47756669b4d3db7498c57353cb670722422ec9426a6898c0ae7168313908751c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab8fa5b80c7318641c6240871b56dbe538f98ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a623fe73be11df974cc858dcc39f007af9ff1056099e2a2f859e8cc829a56a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa5e364463c1907549cf5caa63e1cbcf224c37d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:768cd7f567f6a3b482e6c5878b9b889923c1be1540efcfa2db47089111913cec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18988a230ad480bc87386685870b0f7c10fc155 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee1788d52000c44141a585d279cd7c0331d3f84d8c07ca364bd6ca9ae4d42c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4633e50b0deac7070ba8d9fa357044f973e2e0a4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b7af78a7c27f0acfe404606d5ee4ff1ae40a262f213138a43a2c5ae79985ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccddd963450ae387d76c61b4272707a495cffc86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767789e810f7b34995d3461f92ba36f900696e90f79f2426c9335207eddcc3d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fe733d5a4375d9e144d7db01924d6c207855eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bceb038d8edbc4da553311c3ecec9a236b1da9b586372029b3f4ca49c99ba85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..635c8af4a559a351bfc10367f4a54103741b0223 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5599bbd30703422d8179e95c59187abcc3f4c0548726b220a5945a8d2253dae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..744acc99fe611699ac212cd2e2de0eb29bce173d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf6f0d64b085cda4a00d1ec65479c2b9f5301f3a050bc2bec7d586f6897814b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e93779060dd85ab8b90b496438b0514a591f33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4267f58e0db3306042340c6d62b4c8edfb18f5ce429c8cc04e3d5e2b5560287c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f079c81f82154f4c013ceed79806285ed7b77e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee5a5c965ea29e7c81703a2c318933e74a411c82d995c404d302c23767aefe2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb3aa845a9a177cae00688a84808c27de90c6fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323b1d9c14b5dd1cb0dde9200d04fface720dda50f1c791786f6d2369cc1a798 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..192f385266c18ed3c2be283cff983b33b2e391e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239c33cc85c9597f301060095140a5ad86f70e0f91e8fe76368e78b3e4beb6cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cca806c6e2d323efadb9ebf7cbe28c7c7cd393a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f79963f7285ca8d62ad196f895fd0660ce9cb3b150294001148e6c8ccd8c7f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d1f8304cd54bc9ce20071e363e84a645494d9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e212093610f2f63aff98bea878e745d38201fdc8a985dba7f4e9847e1f6313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb863e68dff6f24185eda526fb605523fc34611 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142e3643b8aeef36f9cc3ecdc7e89627d9d6a06028071cd30fe216e6ca88037a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43888e73356281c984ae861dfccd7adb7350d43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8908c2b029612f96478883753d696ee74cf8b40567a64637037a04a4070337e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d51e4f9e549238c690343aa20892a4a6d4e38131 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0a3c6ab7f9b1911cef1950564ff95f4464b0c8f797631bbcf505f08771f335 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc76dd0eecf6d65c72842c19de6491c572c8941 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d67a46b350caf125b559ff43485cff0fbf43f18f8998eb986cb7aa25e7b5e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..633a3bfdba11f6d2b6981df43d4d4349e6da1579 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225a8d8842dbfadd90708be4bbbfb81a07ddbff381bc71b751efafa478d0a468 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0350b86c61d5371dd66c0b568133cb7afcf7724c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68af13f85102de2e019c35f0c8f7f995b59048c14a8b2f1ccf294a23d35cdaf2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf4caac25b096c4a412ec7323e2c5e0ed1601922 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29e7a295c15fcbc0b07d73a5e629e3bceaf1280a073a94708d8f526cba61692 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..109d1a27ee571a551f71adcbaa1e043bc82b1568 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36eb4ef95e82aa3de212760c0e760876b985378c364d5a0fdcfb77858ed99b47 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef747823cf119961aee06d3c7ef2d6fe836206e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4d97406010ba5fc8be94ed3989f9c41f8722a771021ffea1ed9757595d2fb69 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e49bf345fb59e68301a24bb727a758cfe5be28f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2fb86df6d31064462db72e6254e85a85d699de1f7c79c1b7641e98d14c9983e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a947016c6ba61e38e2457127c996d43210a980 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ebcc806d8153d3581d507729a179a0a4e78d99b043277f750a90237a64f72b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70234e3803cccfcc8040632e70025b410a3c478f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93dc1a56ed5d479a39e04929520e47db94fb53a46d9a370082687c03cd92ab4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fa2f4c71b6ee69a142690684c14d3c0bcfeaf9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68656574f6d78314cd68a83181e71bd37e5bddeaa90ab511fc88daa350783d28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24abdbeb571f8c489eccdd8b77dccb74d2d944e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673bb6889cff209fe1a43ba71ccc7b361b4228f9a33a3f58a4a0909a953cf06e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3d04b1f626f2b4027248a11bcc419286b0432b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653b2aa2eb83947b2a082ce7d00f16d5aa0acde447449e5dbda25f570f6fb315 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ae76c92a6b6d04da933a90852bb5b15bc20b273 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab0a23771de0026fe0f8b3f987d47949aaaecd192b0e13067a8d9693a25c11d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..880578dada54042b7f8f475ccd09719119c3ae8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce72c574a6c30bed805c0e1107f47c2b2f1745a397e41aa664dc399abe1eee07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d64c602468ddceb0d64a5a308eb282699db04e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4997cf92d7b915c2813458ec5165fa0478929f2c741a14ee6bb643fde8eef6de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32526381b31fe3d8b35b138159764b1c6115b0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec69114a5766c6412ff2b53612b554095fa22c4039db64ba3e48488aab44631 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..845cbbc6243e0508bf8872aff9369afd61e5939e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40ece0d8950cd47daf5ee77cfd1dfa36d6278e4572cb4eea6b0de8f7df0f3e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3718cf1f5bca564812517ebda6fdf6cefc94902 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a408e320b5535223fa785458f5140fd6d89e7c45061e7054cfd5f274de03913 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ccb69e0dab779bec833d7cc42d58bde2e5833a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d948c6fd926588c6f052020e278bd5c1f0e410fe7ce9ec09c73aa8b3da791b8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cbef66757615ab2661f5b9cd1ba21609cbcbfc7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db23afa55353f8e9706239768c9f43e5192532115ee833e922b2472514e83559 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46e683e448ec145cca18ef09a7a21e1c37163aba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58103812ea5ba148f7bd3a70b37743d31a5b104765b60912235632c215d123d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa4f5e7369043655853ff2696fed159be4366d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2db2890678538b1cf1aed77df58e796f3e0dfd830994e02f5910e57a647f822 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4588cb7d755f0f44e8a470e3eb7deb91b1295b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd6955dc23397b931776766a84008b42c470506fbaaa1eb06cd7e272c901f49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..013bc9799a47e72ecc744a247da2c6179d8ccd89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84111a0c9f05720d921bf05368562b66b26af29e2e0b8b7bfa36faa7766f8be0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fffeaeea78c3613027249939c7b2b5bff97c7049 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ec22301fc4942d86c3b69ac33a8dbb2588e637a88b15a0df0a281ee701ff40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4844789c96133a3f41c369849def1b32ec21550a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377e7257b5584bde9cd52f0c29c3b1ffb930a8221763734c7b125d989ac1de90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e2a4f9ac2f45b4b5c380975dbedab9de32dbcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e8cc8c78023e1eb2e44f547b939e958fe1e442e15bfd66339fde3b0c9572cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d52b9bb8450c2ba76484cf64cf7439640fe1cf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df811bad5d4fb366e8b0636f7b243d81d32abefe138031e26818f1bcc7788752 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb21ae78a544bd9bf04c763738e98ed628e79856 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca846906bb218f9f1308a5304f2981719d415139fc29acd7c70d0a77e0927c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63161bbb58cecf860e87891b396a9f0166fa8efd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f148ca0e438eeecbc9f8af96c716c7975b223a8f932fe966b8c0131e90e8d68c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb34baebc0196a4bd1b1b3e642f92f1c289737d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0977391d6193a609a109a94d631ea7b7e6ee96dce82538ce016702f38676a388 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d828f735dcbc6690cdf7d67acb3c0aaf01c9df3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32157fb33c64e339bf2e945fd58145ecd89687e78b7926d3d6d3e8acb3100da7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7bc928a9f731f45469c393ff8eb184c74ece37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e8e1fa16eb0969de68f494463ba02b2db9464580f948e7f57af7ee97517602 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefb02f56914882c227a7145d65342dfc1a2413f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a13313dd4d6bfa81196b0d3308de01e80546e0dd6487abdc36a7784a9fb553c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de263673119d9143b47221e9904ce2f590764daa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b564826de37bbefecc445ed91d812735451fc86b525f1d4340f85487811e4cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ab2b0c43e81d1e58441136caa445988a0112126 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e1480026fb6d168660dbc9f7bbb98e9e412507fea3483644e431146b461f60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..528caff4724eca5e8fae36c8e587f6084fddeb4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85e1bbe0e4e56039e90735c287d3ede4f8ed076fbca1375f678d76277430e48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3a323166ef6fc57c98bca2e70f3895bd275eef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c1df077f3a76b19a6de0e913ae269a1721b30b5ee5f2f79bdf12d09e1112be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a92e18be1f8dce93e903b64d2e544aff23deabba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718f1911fa1b7d1ec14a07e1390386b336c039288e2b8dd35f1a4028777a13aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd10aa4f9518439dff188c637effb2f68bc7c41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad8f63984abd659536b00cdbcf4b36cfab00852a56fadc0477f41034117161f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..225cd9246a009b1e0b550831a3edf1b35e4df0c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e68d7754e35fd38e4f2f2f61f72c7ca08af830ab2cbbce68194b8f61f19935 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a664a36b209f602e1fe0666d7951f7f7103214cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b55cbf96a9254176a294d3002b0846cee6e49f9d979bedf0279970c7ba072c0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef6d36efc19721f623aabac31aa03e8fe699c20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7ff1266ae865dea21e5901ec981f13f9b01a7743d1ff080e6c8ec3fab10bfe +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3926250abae22c4523b9e52a92a5ed5d0e60f4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2e1a6417c2d5dbd4acdf11e6586c1cd1ed1b070a02dfb0a140281beb648a75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51fe983e727e562fee94675844ba5ed8106eb74b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90563251b391d471f904ca7290ce66602ffdee373e9ef323a1f3ff639e962919 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..420deb3b1d438de89d4db8dad867f4b6c50276fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad97a1a6194f6c212e01a25d9d464b6852085364670f03c402a488c16ec31f83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b70f2f4ddf55bb7f3661fb589958115443afca6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2957ee4dc643a671fa1545353f7f9f19d237379bc1c5df3ff4a589ce78818d6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc6c334245a377f3b3b39a592863c4dd95481eb5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14533193321d8394f98786508476d5854f3968c66d470136a1482219129e493d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e474c44832ac704fae1a3495b15ab1ed897460d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ca9233b401a4c57836153de473b045dc09df78366915372ec5f105b71e72f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1696f5863d6c0dc5b1d0735418727de0b111367b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe804736fa3aa4d3d3835f8387dd67180816be3dec4a1d9e32d15bc1322008fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f041b2cecb24dfba55fb6471cd00a18462afa2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e9437601f08e418a4ab9d4bd1d10478fb7468241b19695e38642cf7c23c839 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c021fadad601a54549143c5eaaeb3dbe634ae11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90603d80983fad3b1a5434798dccb30349939b057c35bc00e58f8b4d1755e2a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f868c7053a9f9309897fe56badcca32b4e6a58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ca57acbf630fb200f9bd76f37922ffaaa74ebd5877310f5718123795909de5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdff72e7132d80923f1a3aa27678b5ad1e1d71dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c93791f16301af347bf5107b90cd032921cd817e98054b8b7ac5f2dae453e59 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68126ce12534821fc8bd0dab76a47b95b290671 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0454450a7589b9305b21344eae4d5c59d638b837c86a7c57305b6ad0e6ac9651 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc49fbedd517591a6d56fee5e1ae9ff504faee51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f237413dec67cbba75923ea2fbef446846ae322e3e7c3bc87074916018cff8fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df06343b2923cfc0bcf2f7a453e4de6cfe3fade --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f01c92b4a4eb16bfc80972b8cbd3cd8d3ab417851d7ed0294ce2376b45bfa79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a85c3b2c979892bbc8b4681791a1bce2999803 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c0eb868ca9d488787ed5eb61a72e200bc7c9ff852742efecb3cf533877a6f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ab79ec920f111033e526314a8eef578a8dc614c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e0cb572de044440e3e934ac7907a39167e63a1e7e938b3307ba7cd9c187017 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8dda76017e80f7d465d77ffd0930cac178b239 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f977e0f8d57f9277adea586e44b3641456f3dc7351b806c904aa5a173760f3b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a695cbffa9e7721dedea7e368561af1a8caa58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722275243f0bf8790dffd4e96eda4ff66a91605afd5f5cf6ed13962905262286 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c933956889828226d34f32f3e0bf4cf2d452537 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458c64bd69693313821c3b3aa531c779939457277f5c80d3c9df805974d94f01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b46969a135c399ddacfbb3b8343259bfc78c445 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4df004f88f3f04e176e27d694a454936e39b41eaea7a0c91e8015331fa60f24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e7be14c9236e1df265c4f77f6cdd3dd43aa2e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6850ad76b5816c9e5e970a700aa0802114f78f87001bbeef03c55a3febfcf6c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c53fa3519a15a68f4e8a1a55c18b2e48cb8f6bdb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f47b23597ae322ba7ae12bb363425a16b81444f0b94afac2e1ecab3ed14d2c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d5948c38fc5695534cd57c87ffc7ed0b437edb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920a0b6606ad1f9bf54321e362f4ffbea3aa8f31d18436c74f2dc098d35b36cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7610ba6ff8c6c9aa1889a12d817ede56fbd10a15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:245406d9b5d247090d82cfce7d9a7f2923a5f03c7a2fe83cafe3d244b1e67565 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e892a35af5a59bc27bf13289f01c395943da557 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3345726681b99c53d5fd981750f4a3b55ede57e89df46ae55a1e12d3d6949652 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d04dbd1b05987aaa807f4c84b9a65b6f2fd23a9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c191ef4914453cf4125a1f4b42baef937eea83dc0874316fe5fc71becb95ca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ee08206aed34bcf4e839370df96abf0d7c1d59c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711a9d9d18dff3c3edffb31d22cc4f929d38126a78cbfb05f8cf12798eba0ca8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ab5f46f8d32bb478a47fb143878d19d444c0d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1352781320cb0d931a86aaf682241d662aad4b4a394660b141e45eb5c331e17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0aa8fd956aab06742d8581d114fbca6949a9e7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820c78e59fcf1f94e17219b1c9755be5e70740aa40c1a3895b6e7c97304bc89a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b63bbb88704f3ea88511f0c2cda8966fc3e84b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c50d235e6ed19ba5ec1c7cf0f46f3afaffbcdd163f27c863a815591f69fa6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c7e09f1e1d05f931fd4168779dc0c59ba30e0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc6b63db717509253af4735b23127f75dce88a49f10285916cabc0c136cbca2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d057e60bcaae01d9e169adc2b2363b4c539d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b3c9ff546b2b10f0f468c9243491c92f745172bd1375781289aaceca089445 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b7a7c9acda5f7ad3fe8394f98876b98aa1dc4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b582e9819b489ace7b33d3b7046bff2adbb2aa43e32cb5cd54932366ebb928a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad700a635829007d3995811b1bb6924745e18c5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50481305cc230e2bd5459bf64e2b61d83b7e6b6cde84b0eb97c5908309e08339 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92cc205f0443231ca77d96bee84cadf166b88fad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1be99025a3fd66cd0586ca2e3ce57b5edfb6157c56db1f6e4ff092b89a1c50 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c77fcaf4646ecb00f5b9b978acb20de2e5e25f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce540bf3e778874ef3e560d3567fa2af0043620367d2454c747e4e912435da1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b269df2313dbf411b470cb56ee11b7ab3f50f750 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0d06b741ce575526ff736b4fb763e3c363d0d71a8f0b313f398621033e4984 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff91d6e01290cd92f2556c607b5c3e82e974640 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560a45f9a81231c85ab97b1538e97aa5bbda8dc7f1cbcbf7c04ac53cbd24244f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd6cf2dbc5809cef0545daaa4a20317664300ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5396879d1c1f3d20dd21ee8655ba8689730a2c1f01d182573a979c1cdff5f876 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2fbef2ee1e8f03707c298745f98bc02ae808f46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e84452996cd38cabfe908dbf9ea11d7390066876c7ea3443c76c307a4c0e09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f56638d4c33b2223923d35e91b9d17f972b4c64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c407d90a16a009b4dd7b75992c105a9589c9e9c3dec4a5c15ac161a029813e73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ae57150056b565d76d1e9d74972df8bdcc57e73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896315115fe63bc3c67b6626d16650a3b5a407d878fd22e617bd325874c62d55 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f83cb131a4ec12427c57f27c589a8a305557de9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db43a7f0ea3119ec3e51b18cb8fb268a1f69b68110592481ee4ccb3676c4f8bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e780558a5b80dbb13202c37b0834fc8b11f16a36 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83e47d3d8c3f921e09f0495f068eef0ba8424708c8a2a66bd220b08dc8000aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f5bcda8aa2f92cc63b849539acbdafa84ab9e2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef82bd13194fa45b1d47f0468ae9f3f76ace0a3d54694b7fbe35386dad0d73e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f80e088b6256d707b7f588a13f2499b366685c1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121efd5f3f12d4c0fe3363eb072cca17ae500ad69c03a602404824949ade3e40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cea9ce8143f494c72fc5a786280cb61964440a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855e2c273bf3a5dadb7b3fc55fd69bc3bc004c3cdcc9980cbfaec910493ea1de +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7ec9b2a18776fac0ed09fef3c293d74b44ef243 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b5cb88ec34e95de9049c477412d6c642369a7cb673e32d39dcae4aa071cef8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24757cd762f4f2c15da7b7ffd0fea99f663719fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d5807615c5d936c5ea46a6c1b9ed5af45381006ecee0c82137c9b7569da264 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..876e3f5e2377540bcd4e65a4bb149b736dcea964 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614c872a477b3989a5d0b8d2536ad4a9100fe7db40211851c2cd61be2f28bdda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..276450967b35f8d3263412a1e5c8e0c66ed9dc5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39e460cc123516ea3fd6fc95816d365d6e83f4021a3bdea3809faf0b8f1b0d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2e661ac3a07ff936d8862de9722fc407f47039 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6507b6d7d8b4f44fc31ef037b258cf58074e6f555b9378ab1a10f817c590d9a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2c94018062fbd6a60d65e57a0ee0c4bfaf17298 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92ff82059f760626bf19ac558e331253d0ade9aa531ffb002133f1ab6f603a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5f03e9dc73cadfbf65f60992815060e0f53fa7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96e60fee1c8b8e502971fc3d8719aaac887e0f84b196f711882c6238b3af455 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f411311fbf534783e794d8482d672f283b31a6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ce9873939955e43f32c0a6fd78b59a7bb575be620664bffa0fed87ed66692d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d31c9ffca3b4ea7628b554d908e45ad6d58bdcc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba479d543796a72c1d6002bbc3f4469e395721de5ebf0384ab23cf18495a012 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16838f6cdd4b26f4810387bfaec1075627a5e485 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2beaeba06e33318dd521352da0f792b0ea8bf4134862c8611adeb6cc87ef358f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7ceb25c8ddca3c7cff4ee830078d194f91b66d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2178ba45ce6890157c963fe5e8f5fc15958d237695e3cc9719d062a67dd50e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef7c0db221f306159f5212ed4b5ba44ebd57f1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e3c461178ad7bbacddad0dc7026bdc3bdbd7a8815154136a1a4338ab98c3c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..973b15d2c8b655734a85d8b45d7e3c3fce4ba763 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317f338df4a6ebcf2fae5f7ec597168fa09fb68af78a764581f9f54e757bf44b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2493104257e9af41aac11eadbf69e56fd6fb8a3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b52a389f69f03e495f9eb7aae0688c6ab9f3ccf9ac29d01631d1a776f7028a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17d3d71389d018c8916b35531d0732e19498b69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45432603731237a5cd6fe123ec42b37ac31f048ef7097e0df8ff5577bdaa2ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1888721e02a4a6473989dde22970b7dae156a35d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51df046e2d16b2171cf944ef04ec276fd671f4d03b74b3545102082e5e20fc8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a6c74b5461f40024c96a411d3a2acc0bc25b3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574adf7a7e7cfee52f462c96137dd3c5c3361d9fd57c96b7eee7729c837cca72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c092f6906c573a3166e7c1e9e70e770d95aabbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cb1c5cf0691affaf94faf8b6f664da7c1d8880e6c343073678ccb60e64a3cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82bfc18365b77d23821ca39d132236a7a78e80e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c6d0211cc5c0cb7348d23ebb3a96442d95f84363d8e1cc91016921cbcf9225 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06fcfdede61132cb528841254dcfcb3e391caf2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd39edda8f9f8634a3ad1afab0e2d120b7e6abd11ad66c5d63b88fafec917594 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a2a522049ac31620c2d06ab392581620f19e3b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1e3daa1788b3a0c6764d919f586ac79906357e1bb007c7acdb2ddeb3d48bff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c89b23ecd26b4ee236cbc3894889498b8f9ae5a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54386935add1511bdd88a9c34ea6584e21bc67b275cc1f56f6c9ee3252d798fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..218553582a32f6bfc3dfa1a37b6e8fd0340660d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a36feb89e39948aa258f7a34c639843148bf5a5f883f7c64c97ebd2c14899a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aa46b011c27b1611ccf4c6d19f9158f0c6ccc35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df803b839cfc000a7e36dfb972cf2cb6a2cf7f4c6f68b4e193cb6d15e543aee +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5b57a99130424186cc9cdd949187bd731f0108 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9488af3af72e7de2d7efd22e822f3bf38084769ea68311bdab465fb85eea4ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcdc5103b4aad739f6d75c74f774f49b60750e29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fe25a32c5c4b67040a9ce245915b574c2822c2f1328e11496733c0c0891a02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe87473e099b95c32363a9a2ae3a1abc3d1b6c5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a5b92e3da105b88e018e2ff1e18887b93867d655c056f775d860fae2329e91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4a24706c369c03048edc1512c83a0d3b2f0cf2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718263ca205e3cce6abc34a790da8cbb4a75ceb9b830de5baec4e19809aca817 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29266f8dc6873497762add71edadcbaec939efeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b97fac6bb732d36e79a139e173a7a7cb2de2337832e12935454aa294cfe4be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eca6da09a8ddfbc33efa12f9624271aaa9e690b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce8903969f748ec0292ec5b1ffe618cb890f5847be8e2573757b6c878262f78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e081bc53927ea9b652863147102be038887ed804 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584fbd9f465e77030bee442d58ae78336021498469d9f4f36a71176aadff7769 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e94965140a8dc4643d9d38182c5731b058b606 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb717d0b6f4cc3ae49c30009fdf18106af9875a6c548326728391bdf4dd148ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..528275afaf39375fe434e6e4a4ca3d5189f35a63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4b3979d44da8f405434c338a3b94a7ebe238d1079b6267eefab78466790ed0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a78f1fcf8004284312ed4a1d20077bc43aa8c16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8692763fcccb635173158880b6d38bfbfaccdb457695e9682818ca4b90e2a717 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd246975b8c471ea6c381d49f3dd0b665a56ace1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:880d5720719d0a559bc4997e57abfaa6cbd7dfca62387d2bbfc598050534b329 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41dccfc78615e8bbc0d2c81f8732c8eb22efaf72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a769388c086c755fb9864d477611fa1882e2853759f5d86267c8bd3da5c8f6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa05fa684c6bdbd3d6009821db95047237559422 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b6ffeb8447c5c6573a1dc920e1dc0d7a0e95109ab76ad93351bfe23e5c2b09 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ed8b1c599aa73cd861e79b16f023af45379224 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35030d76e9ec5fccd15b80405e4c8cdc5b892265856e79c2e23ef2c04266de18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0299573c0bd5cd2682e75c16e981c9d1ed5b3e3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06bef771831ec6563faef9f6fc4a2494fde757e97a1ea9b6ea51653b14387b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5133552e68d411c6e8e988d059418fdec9099db6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3325f2855ddf57a45a5878b96df70d289c9f0564f1fc7429dfffcdc3c46de458 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2b9a6aecd769ab36903d65f738b4499d86515d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693025752d02940aac5ba30fdc3797b001b25e7809db8bac8dd9461ac2556c36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71eff8b110b07487619f98a79c96c6ff0c3dd5ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada7403017efe3eb8a3ad82e0f7fb8a99d1bd6a4091bbed8675a726532aa188c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16b968682d5a98b7cb4cb261e893e67a565721b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a9d085d59aebeca21d247eb0fcdf6b1a32ba9d62945acce665a56dda091f69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbcbb12fee959d134408965a31b17ed2dec4729 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f410bb8a1c2299bd3f25c66ef4bff02d1c01837c16e0dedf037f5f6cee07be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..121f2a2c97c2639204c9004e7bbf5ef045d207c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3eea77533555fed9a502394521835d18931127fa601af530c8f937fd73be48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6e58ac4c8cf91be627d01236299e4818ecd099c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bab5be9ae6e0885455d829286c5a9e2ff48831f34687d8b8ca5e5b22e4e99ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e44c5f5489e708e0ee6aa22e6547e78e6b85552e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4e24a27caac1f9930234c391248404679000c6339bd95f699277ae97829be5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5a89bfa486e614712741438f027efc2d139a05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d889a6f72726453a60c8c0f0ed52b971eb0517fed1b71f11a938a7b7c7cdb97d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69b0072758b78a617adbdc04fb91dacfb4969cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35815d5be1da09082232a0065e4ac55e7a1a5f0c08a39f33932184d050347ec0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b4003fc3d7e56866c7e43664ff62f6487eb1cb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520e84c7a87ceff0877d281148a7b84e480c1dc8a80f036c4e8473aad00e17f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18a1250068e96cae41eade4bb09365fc6e578e79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746b7a433c6005f48973c105c877bcb8dbd2366f0d38551c080ebad449854bf5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b5039a0a0cae29db4e46d2b0e9ae4ae3ca9f433 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea938791d30e68f20b363fddf549dc15dbb9203f58b8ac2f54a506689c620202 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a30bc31e9b3272e97891dd675986af9fa9363ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce6054f3cb0ee984d05a0765d3cf32721842253ca690e714de4ba09e7d0cd67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad4caf42fc83f6d9c0f9c6a6daacd6fbe17297ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93dd82b4c43228a6b75743328bd6bf82b18911a350c99c4b23069f34fae1b2ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe4837b0d923d57a431e5f81c0ca19c80e2f9138 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b31dfb9efda8e708b79c401d68ab9ddb9ee4135d989e91beefe99fb18a1b06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a9c22d7c56494d2048532bbb368ccbe44f185b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8034978ac58c02e7f55baecf6a96db088452e1cd0b9b59fd084bd83ca8b5dd44 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97820a71d9a81a5187f3610059f44fdc7950b129 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddcf2ed83ec61b83207aa879f2dd630322eda77afbc5da98a8e06878c624cc93 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a944f5d9016cafd905677574830aaab82ffe5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb7541bfdfbaf69c7fd2d019f451eb81e9252a7f9ef5a33b9820b3c6462b9e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c7b072c4e0ff73c45ebb004ed363b0e4cae637 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b433d1a6fcbe283f9c2afa7e27c34af0a4e391036a1365bbb15ae94918d35802 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a061307c936ae0adda192ce8f436c6c4cdb0a393 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5672fdbdafc2f293fe0b26b2fb420f127451cb4adbe15dbf738ed33f453d8c1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb4d3b4b5236ae87380563556495b396a1ad1ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8809bd62caaac7c62e1105425143618bd8fd32d08e063669ddefc7864b0f40ca +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a52b9752e5bd7cb353354c0b509172f24dee2f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6e02a79a60625b29690c0f73f2a7698e7fd21b8c8ea7476c8a30d4c91630d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5647a8f913116337876b273f616c3f916763fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0aac66e0b29f653a90d45c11852106789259ef2a2381225805155f0289af48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35b03f85bcbd150c7c593eaef631612b776979af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dc948fde9ab41741f76353d812e4c586d93cb52412a7b5932ff6c21f0bc0bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f12ce36358d14ddc067106ca6f4d86dcc44977 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5814d312e6bc244d3657a531dd54e5b16bb11492258d21b9d817b41d2aeb0dd1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb9b0208dc2345cf46124608ea102d71fec36f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37bb3713f006460146a24e9391b0234b1cb52056fbd652c15d83b7ec4a716549 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..116d53d1bba68b60af1b1ebfae070d97092d5ffb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b051901a67b7949f46883c582a6cdae726c75137c5d92a77df405f597ca5fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85149abe593a3eb2ad8510cabb97448e42516268 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613cb159ef6a5ba8df68c7b1464b3bf468ce244503884c8a3910bfd25222ee6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..deb0488fb12f793085cbdc9b866af91f4f536043 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f3ec0636e94d6aef9868384e6c090ce39f76094ed5c3c1c4608ca959087233 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0271076bfd85fbb05b19592a3a36921398c1d5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce1581df44aa47c8155bb6e598966582dc101bdc58bb020d600d43e74f0cda6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a7a2ae30d65ec5dd6ddf3caa8848b95c194506 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a52a6551f37083c21bb9819044be7e3c3e01de6b3d4f94ab9a49d4d7d29b14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a8d48c4abf8267f73797c4ab5409f3208373c16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa8ebcaa2e9f4de591f9b76ff11e120bbaab8226093fb290382d4c7611f9296 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e780f3cc5124ab5f5b4a91ff89c60db6d4d42c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb047e156d78b0ec100116d0bcf40aaf2cd34c7bb10f82429d4d06074bbc7e3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed0413a73c168e4cadea83f60602dd8c6e2ce56b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a82f1a82e832b9b59bb78ba51f61d0f6f5465792d504c010869f72c7aef148 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2cd83e83eecb2dfb2b1b132fb6610138ba26f97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbe188313498b48822b6fa41f63f7f73b2cccc869818d1c9d45b52339271a529 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd1c2a73406af209533df684b06c7dee4b44a98d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d32f6f04b68e769ec5d75c6a897ef3887f729578078d0d261344d1d248c40c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..753b408621dac17fc6c63764a176bc3073c57c8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5bb59ac0fb9bda0c557917c8cb811f46d4ce10c42487d34e68ff7edf6b5aac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1400ba438dd6e6d6d0ae3cad082cfb96338ae7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f598883433f2084ca603bd4b6f4629315fef37d5b9d940be268b835b7a0eae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..baff46ce2110423f351638341b11b46a865a76fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148f27c6c6d32c250b261966889ea473b619e6a8a929c23b68df6b249e7cc076 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10520634386b057fa715d79192c269e3e96dcab3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a41cb5f5561dbe7de6fea95752e11536a257464c4a99ccbae4441493e75dc0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1855394c771ddf6ac92bcd31cefdf8c15332509c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbb205d33db8443a93d91c330f82137107fcb4f9e80c45a4c863f270304fa35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbf48d10fe659b0c1a736bdd3f5fd4bb15ec73dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d724202c9bc6f9d2da52fe475172d70c03ff4219cdcde6172994acf6e62961be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f929a8992442a52e0bc254ac90fca627f3ca76e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ea2b82da89a177ac0a6ad078c55316462319c228a12da737e3f5d13566031d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5263e761fbaec7710b13673299e5c499c4af1608 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99d09bf4946cee41fb39e88113d0313c7684cb647fb1def93b8efd28b343c21 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4c323cb88d084439c30b2618a7d95ec44b6f0e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2887896934e994fa5a3bafaa5e4e2bda3dc6155ef06f57808f2f0338507a960c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5abb5264993c34792a35a21e9604c390b7aa0ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9239e8b30070092bb45504cf145aec09f9608684b530c119af186bd2a78dd731 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1580693125b2a50dffd93f92e030feaa50e5de5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ff1cd654f6b8248d56e0539ee4c2b1d438c16be8e3e8ec3546ae5cd1de603a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f5aa83d84b76de0a37ffd82cc0ab0964f78904 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d221cdad4262deb60aa6d702639cce36b7a9b096509f27d00a02bc081695cbd2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eadeaf4a7145d9ad356d653aa488e85b59ddbab4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:091e0204f32d5ddd6b16e9d33ba40bc01c56d3ed1db4ac86963efba2a9ef4877 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84687a5f45a1f4437e9e18fc26e3c433353c2435 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84ac3a3741f63183921d13a1d601df3fd5ed2f5496acac4cf37ec6bb81f2d51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e3a330db0fea00732e8d3dc19018eae77a0f19 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c57841a964c8dca2156ddd6d64202fa60cec7f9194962192081167ae9e0a67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23136c66fa2c3c05eca32806cf6fdaffff9954fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:931306251626c2e58d9c383aea7ce78e2415f3282c9d7677a6be52de4115c62f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1343d65fb0bc07417a38b0fd4c666cc9925eaf4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7096120cec09b5c995af5a7c365b780d0f06759ada0bad8bdf0a23d091301cb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cad2fd39d41c54a1a0369280ba7326bbf8d5a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3ffa50355341e8c467607545d71e4b769d4b9b24e09ebe3db3e28a9d4a94fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..243b0082f36ab0c71223f15939fb30cb2d5983a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3cc2eda4c2ff5f8666fa5588b75884fb01e2d1073d4b27c39c29bfeb2348c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aea61322c645766d207d2b9a5524e7fc6f6adf69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5263213fe60f2b7111545e7b462675298fe4ac804749a647a67c99b0b3689a27 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47a09fd313383d6a805c62ccc06f890746d4da6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b4cc89548335c0e1e3bac157297a139dc72d207b4ff46aa038f809e1f685be +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc97c21b5bdd8ae79e454a4e0310394effe93de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2b44ebd7cb68a1067173f09c28c8974cf8b8c76b1db4544a2d340f449bb23c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5698123cf9e123db749ce25e6fa59b7f62745af5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feca25623f006976adc4ede1c6a01a4734aaf3ce8be182f24e7305fcd80b5580 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8acabd613296f4c5a511b2e331afdfd62f809de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d655f23808cff417e9a579d0d253588a4b592bb89806fc0c2fb63ef3f8d24bb6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69112f6e245696475d31cdb3a4a2d9f8d9174664 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d0c02cc3e9d0647bb5283c2add2ab23f77851a547bf5f3e91d1e95a15062f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35b3aaeb01bc0a4ee37d81e0b1f44f1d5f01110f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3248ef19e3d857d6ffaa002a15f8af0edda3f6f2bfb4fa801e2e6d2107baca3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..deae1fe5d238d89c01b8e9dd507ab6ec7b181786 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42151786b29b900b0269f607b3dd4977c91cf4af415c34818733edc2cba42753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..355fd66a6964ebb1e6b297417d48f3fa8d948310 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de810299dabd37d80f892fb5d455200f35316ce859af7e9d491381452f526e76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fa9daff14e9caf54b8c0c46e685758ca570643 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0155a41bb04f4712a926a88f82ef1ad09650981175da6b4b3c4abfd63fea42b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..833eb1fd7cf78426d37d7c9a5627c699ff812314 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c43bdeb4e8db06886002dbc0202a063868683bda1f80b4ee30062a992db91f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..124f727cf606a1114b1676379d6fa8e155f7f3ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2924137fb41c686b8f299950ceb1911b711266d62c65c44cc41cc279fa7819f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d37963bda73416a58957e18ce9e4908e7eb648 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4aaddb28c6b44b591bc773b89181af74ebcf4f0cf8e48402d0c791665688ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..680f7b961b29bf32570a8ad287fecd3411252dc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316cb2d8889fca9ca4257efedb2708054e3a4a5b45055c758c6f91522a5da2c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75b55fcbfa47a710a69cc4771c5aac522e1b8ad9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef6f389a84f5aa271bb1636255aced695a7118597718e2ea3d1d71aab67a186 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e079bc26fc885ba0205c2c3edee48da371ab637c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d234bc481b0143a8f3ab147e116c73c316809ae82c7371c8e5fc9628a084bd89 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4daacfa6bb8b5e3075868206b76f2854c34f7b45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f170176c55b4c962a63c94aad600e1511d2767550ad8511bf2f48b6fb082422b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e9926d4e776b2154eb47183600f0368e828064 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205d4e35f141b80406ed5520a6e92c39a38a7707e8c29e9b64c86fa6348774a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3efdbbf5e17d80e4e101e94672baa18e37c31a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0291fff1dcabdef5772ba4b463c0e58c9a7c18f22680ba85a9f1c12332467f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d0ccd355e09eea4e0630d949f69b165311cefea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24147e4bd8463c67e3368a97a6e7bde3dc5aa9788c139b827fee9b206b293826 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..310c0ac4044eec54331955de9c3baa6ae34bd473 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff77567e0f3122c8719e579ab96706d4c393eda0c3802541a690d208f5270a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c423075a08a493b561c5b4ad362d689858516eac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f3b77b5c266cecac619f24c08a33f456911b461ca3b6283c83d1dea974a67b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a653f6c998d654225ea212833906e7f9e86314e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c745ec7b9966c9ec97454358d97ee50f2de1cae1ba8143757d70aaec3023cbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5614e7cb7be88329448cd7d5fc0b765d3e2c1e47 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2029d5486086e097dd86ee7562b7cafe6f398a393873df82e51f3e512707281 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d9691f04ca23bfdd9e72f0c72202c19a5a0863 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:301fca76f955eea7c0e5d82f2ba2606d5c31c24fabea71ea7ee46195bfe9eac5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50d9169f38425953471e2feb1af57811bc581c68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8455c690251f366c577706e330c5642c926b507c1bf52a13ccbd2aa9942b80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b0a797c39a0385688089f7224e20a326c4068d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c735911330f1b63cfabc4b5aaa286395dd00d3e30a05b0d2f43dc37df7cadc7a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3b417fe815b2e129d107d88606abcb771b9151 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a50e3ef1940b6a07d71f67b4ba5a746aa25899b634828dfcaf15335d0663d8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..462c82bab53335f0dcfb40e3ff7b709a77eacdfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1d6c92256421eeceee3061bc9e60ede386ebeefa7153005525f0f708cdc5f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e44b12fce1ec3488028227f26b7075c518d2868 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f09c66c2190e691fdff68500a4a19142b96e78dab9f29574e683cb13d09067 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc73eba95b7046bd0d4477b3e6944672d379eda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479bb67428dc5215865bd6c858aca099fc26ade78beb74338bd23ef169cd5c27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..853c9830cf4e2e97125e3fd2d534c4ec7f5dc972 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0369a7ded73f5b17d0c82c6ee049d145d94c5921b5ca2dbf329b37667e496efc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf7f7cc3b8a02f6e41360316ed4d6676b4ce5c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685e63a9662e24dcd02b276312d56e857cfb2293ffa7870d1b778224290f2544 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..250bc253e3aecd80807d3fdf86f72d73d4ac83f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f363078e8a84898488b4b10bba13d1ea7432d3b617f764371c7d0ddfc41507 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34dd4312203e1dfd95b0ae648ee3c6668e1f7a10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe707683c540b2d7425be27095389c23119223429c9c1f361a8eb95ca1f4ff1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88b9bb5a75eb62df5de71869b1ccbb868b14132 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf1aafa23526af7a511931399d3e3af8789a1d9781708a67762e9ba2ce7d36d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a850b2286af86dbf9b76b2961caddde90e1bfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d88f59f0d66d21e2fd9cbbdcd5823c72ad585147aa4e7d0fa25541829a40c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ace8a06002d004d015d34b9d9c35bbb8ccaf224 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9f67daf19f1d34f27ff2458911cc5e7cbb6eb5900c7cbd8dfff3591b96e3f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..daf6f6aab2c985802afd58d76b7a39fbddebc6e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1acd5d9adb3eefa2d6842de0f745b4ae7e02181ae8b847160f38f21586bb9bbd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..926f9e657a5e655c12cf7ae686dc3df7c024e93b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08b719f6bdc721278a312d3bd091bb45b5e59eb687c768a4e936543ff79c4fe +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8166e9e2a6111c5dbe0d4eea8fcd182017d5072 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2234c60211ca5e68292fc53b8baed184ce5c4a2d31da28f7e3c7d6169392e6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3d140557b4d5bb6e97d53e3796ca0aa71cab76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c30a9a747f734d5ef580d2415ca8c743a2622fc431fec1724591db37c6220f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1169953e871aaa773f0277f20c74a9b9da7b46b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fa0943ecf025405aeb369f6c86b61789082994ad5360dbfc74de44b1882e68 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ef07b6b1e464b9ca2cf6fb60010611d2f022c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a504b6f0b5abcd914999bc2b0fd5ac578e2d97a10980063e059dac2fe0acf8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9576e8a63a4eb7fed8f1505bac3e21c77cff97d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef225f73f0bd400622e6fc698c9053d83a196e170596cb712a1dab2d1a4649a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a21f4bdfabfa7583e19816110a631b5845a2bce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b46cbfea57156a99dacb8371c4ebf02c1447276b1788a0df94a0cf22e0acab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..926a177ac5cf93b045941510c837677dc9739511 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a16b864875cacff7f91e17d323e82dd136084926b8f068e12bf61ead1b71e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d6c3811c32c1ba0684996dd59758e5d3b6b4c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd30cd8108939aaec8a33bd693891c109d681feda307f00b5eef809e4f42687 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44144e9ac5aa8e60a0f303b803ecec3042d5ae1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d106799005f7577d87a0bb8a75acd09d12efa5c511e6c65ae6f8872d81193e14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e866ae79fd41fbb52e3c3636db90b11414b9c26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12b1fa29749f798dba25b831cd4dc23854eca490a013ba6ccd2c2853b27c49a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6ff4d47fa42235c23d7d7a56a707be8b95c23b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b6ca2936e51fbe23854aaccf0c55792cf6e610f03a746f1526d4a818f20222 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b55dd39bdd7350a5639b8250b8274acaf06ed8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b5c9899291a30f3663fcc575ca1b35b387789d6247865c7f30320e82845f68 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45d4aaae9cf50c6a08d1ccba51465c9697b0ae8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab01724ca306d29ea63735b258485779d5affbb48ac5714a490a183e80645b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39498003d63195e9b574d3f3138d3612a75623d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ca64c1ab9a02e1557c8675be01ee4857b104e0b34656ae57f0bdaca49b890e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7d95c5786bb2756a24e7aafd9427c3fe410cf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3990233852b718a879e19be3b3601c3141b82642106abaf4d5cdbcfb3de03f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a585468a10b30850d39244cde426474c0b647a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9aa1c7d1c761b5208a8ec4c752ac4ed45d3cc96ce55ced7231d882df96c4b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ffef5d476a27c48c4ff640754d40e209bed63da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e74fe3f9374c560e7793637665a1f622513f061c0e515d01a51ddec0a2be1aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b16f6f302d6688a5e214e1e8acb7649c60a814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8d2747c7283931b9f236c6ee7925d7d8a14042cc9d9fc5b4e3bebea6132c0e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f9575f8c9c9c44353131125d15957376c16df95 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d82826205146a36434b573805f2d54485286ba536fd6ad4ff82f819c226656 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c76ab1a9efaff9a627405ba3b12ab8da7be339 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7180f9e05c191c68c04c3a9fe0061eea7809d9c1316a50618b6a800d2d405231 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..985fa15459fcbb9f896cddc7725dfcba8cc51fdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc889fdd457149d0184db37da192f87e7315787c2e6994066bee64b43fe37161 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27df7e42515a92db4716ab4f4ece071199ae9600 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d9cd664607adb8e43aae7699f8b8dcc59e0bc3cd628987564109ced054522b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a241fd17413b4f3b817fae8db4b4c4a0fa4a8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fc12a0db1a570bfb6adf0d0f446aeae960cc53093a2fd5e270a0cb3fcc511e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed6b837656f3f1440dd1ee0c76ee6593b6113290 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798f9e0ea51865453264a908caecf19a287033299dbc0822a343190c503623f5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84fc76d4e9b8eeff5a851c57178254108a656eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7c28610088311cef3031163f22c3dd6684e187cc953b8b8b169dd408d853e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..070674abf724f1d0644ab98b355732d34206f0bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5265867abfb071c7e745094f84603c5a451150128c4d36b8dbdfeaef3ef10f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0befd0b1add2f63a40fe7d933aa1eb70a011a814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b08190099769cc06cf7cb4ef5c564e0f890fc21abf3c12228b3924ee7f561a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac91128f2bbf53716492e5de9c7fed5cb869445 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b4f6db2db9e6c53392be5679d145a12c08e5f100dec35f31e21ad064e0cf2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dafc8d2077ca0815b2ee2197b96605e734daddc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab736828d72d4c23f28b2ae3ff3a21ee90c8a5cb0d0184433bfe6e16cedf7a00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e54b95d10006ff402a2b037b41fff0487295ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9fef0d808fb0a152e4e6e83111afa622a4dc525aee891fd33939546a2cd7d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03ac2dd985afd1dd7041cea2306d7ec63d204723 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175cf8f1a92024ff9176112cc37ec5f5978acda1778cdc33df01f1e738179e5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07432c297fd6101282b4ffe4f1ff72fdaeadfe29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cfa5cfff2d47d5f216a58e3d7a88a57982b0d4a9503bb16baa4cd6e0210d97 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e91e3a2f65652151252558f266a13f039117ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e2a91d6df7695c2841d0b950a079522ae1df1b637a7fedd1d44391e69dd08f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdd44e085ecefbbb645c556095027e3f61526bbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef965b1bc79713540a6afb5749c43eef2cbf86718f46bde4f444b7e420e9d89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dfa08f48980cfa34e6f66bedfc09763c1e090e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f811d381ae4abfacb5cdc65ad19724617b254de69c574e6c34a0f8994bb100b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9038ec55dff2497e73982b3fdc523ed6419dff78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1f73fdb500902e230772e9e676bbce3783c84fc704ee97261f139ac9afa413 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c8dcbb9e673d3632924dccf651c96cbc21697b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ce2243c34a62b9707df8f7da225d05a240fd2d2b908db254dcf0f7809dd1dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7600cad10e6b2c451aad12fb252c68f624819a94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5b2ceb8e1d191ad5293eec81d124ab023f064641de05210ccbece5ab4a87f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e20e6b5750d35a171a1e7ee05102606b819750 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cde46bb306f2887c38bf4fe4e79fec7d21bba855690e52325d2e344bab4fc16 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..022945a86ca205bb6b176ac32ab6025ed3fcb523 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c7702a03685da79461e0171537eca2286f8e47250050f807b108d83e06ddd9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce23e0a077540517de5ad956d25a718da4e7fb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecca20fdc357f89d3de9089dba889f976b40742a51063fd15e7dddd369a15562 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca412b154c1c6bd8ea32786a580a447bab76e262 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40071f249012d54aff2fc6a4f979dd62a4f73781c121271dad729817115222a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95a9e92664b0a2ac6de7f18a4eb9633229475f51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01f5b48569eaf37aa7299c872736df037061c37e11d12e8d44b1597edfb9c66 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5cb328f8801430f09ed82ba2f9c3fe9139c4e5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e09f34396c6f6142e86257064bcadd46b7def22e967296e08a991dfbb44566a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..871d295521969b520dfbe0d978230a374ec3a8f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6f9f9129cc4f938ae970457e0565e51fee6d0a5e649a0753d1312362ebf03e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..905eb8f7004f6254779fd3a88794dfdf46ab11cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b2e155072b15b45f372cc46f2cc73bbbf9bc0ca475bc7706288db1e759b84d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2a6e72edbb4a0aa927b9cd5854af7bb6d89fbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088922beb4a62abb0c8f438fdf1f238a4bf94e2c3c13265b83e85217798f3deb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d35dbc3f19aa27617f8d454f51ad855f74c10259 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1075536fceead1ff740470bea4166eea79c4f8257cb040f8ed1b21184ed8fe9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c89a7040d91f15e8c6464852f0a7f8f2511f7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de20120ac1d452002202a8566308c8d8f5aaf529b11d4059a27c197ee1c7e70d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c0f5e3183a222b55098fd6ab5fd133835f0f555 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2bbbbb56e74aa8132012df2769a054e6833b20a2805eaf0159af8f488dd2f54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1feb45e642fc82d7a0c48959c455b8d146410548 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca46668e65d69c100e40fc2bca9ea4a271bc1a32bf8f8f190dd8e50c916a282 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..add92278215f02ff78da0bb5bf5cb17250d99d78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4377ae87673f728b488bbf42c1c27cda18c23fa3bb7d962e8e332cb02746ddb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c57731da948c3a917210edaf8103a55e5890c309 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef685600635966674ef3c5ba9c75a1d247be738b14e21019a74fcd9cdc476a9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74dc0243aede1cb87b831356ab74b097e4148e5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d9b7dd7290bb8d933405159a3fa01999271ecc5aa39bd05bde28ceb9d5069c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01690191e354230fac6d09f9cdfc50cc451c6439 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28f659fbc9434462a5ef54d447e1cb2b9282ed329827e1f4113eeda77def413 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da4c40331c9ff95fc7428889f58c1c3b3d62638 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db83f20b0a077277b9962fdba38c124c7a8f8548d7c6657ceca12c517aa91d86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f69c4f7cd687bfdf98af21d778b5cdd2ca895b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb15ebe177fa80306c24ebcd3e949ae3d9714d465f4e57cb67b6eaf3136695d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc8a5d227b8bb7c4a39b095e725e62d0434ea85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433737898bc497aa19e8830ae9398e470e30b684df7d6dcaccaac2816f27acab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2f4bec34842359af225ffc08c5b0be56fa71be7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78b256a0933badd4088966290c004f34c1f789977be6728ad80c23034dd29a0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b61e6cce590f99f7e72574d3ff4a3caa32f5b45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e22c53eef215f6a53a9d9932081b7193779c9ee0a0298e60e4c95fceb0736d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae573600278c6ddeba85e6e6ca699ee1cfe828a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c7242d0c6325b620498315a2cc7791ff1791df30f52aab341bdd63e95df5a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..996efd07394b65b8f4805a5170dae81ebe20b347 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e19c193f2979992d70e17c690708cff83974c69aa138835d8c40170aed6fed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28638b030b463ed3bb4fd35d4b5c8efa5b02aae0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272876bbfdaa2d75361389d2766f777b15a3b3353c288751a4565e516c47d78e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66f007d426387d23663c8aec50cfa002662e05d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c900cbb62e64e08750f2f4a67ed290a106bcebbc9b0aa4754c3b4b620d71842 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27d9af684085ed23f90161b7d4e03ac2ddbb3a86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce78c33b5353aca20a2665d1f314ea69a412bd41f232acd72246287dd40bab6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fab825a5c4e994d07856d9db0e781a08a7afd65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca8508204d07445406bb0c6b401252da432a1907a9087924a01e56df4c8697b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6813227f41eaf918c9ac1cbbdf7e47a97f0c6618 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bbde9354e2b18770d5b1fe363a0b5981c8b03ba52c2bda6270fc5d0f517b9a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1db48635f123f1b5a9cb2ca70c07834ea5b278 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c82b6a66a7e61830418cb7178015ea5f8769621395911eae3f13daa8c052d0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ab9d47aba229ad4083f0ffb518d23dfba9d2f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7b1278ca04c37007041613a3fd1e7f4ab40ee0dcffc1fd7ade27d1361ea9c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0485e901218441b4a96cc9190ae6cc1a9e8d790c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02be60506533ba337bcf998d01ae57bc56a0586b97c64b78fec8859119f4ab96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba93c288348a0068d48d68e8ea6915d7a4d0678 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e8560184dd7333002043a81fd58e21b651d4a74118e1abf2278d04ddc03dd4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4c7caba35dff13d39caf82b3e8feb816782886 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98867835c1bc221425021c178e06d18e67835dc7e1cf83ea0f4c3a9987c0ce0c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f660e18cbb46aa28aa22939711ef414c33d1a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6bc8abb415ec78dffe000a0869906c63e5c9cacfaa8536eb58d1b9ac3273c8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df15c641d458b6272937d624b1fb9c32e739d02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f9d9ad08dc66d073ac36162f7c3923886f9423665d3c47c995207e9cb217a46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3746ce329a7f07a455326b3a8318cc9c03c0780a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5245dcacfde14a52860b441fb360644d8723224f7c582713a49d0cee36c5cf14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc1edaa595e4d3424758b41be98b0372e70d8f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292d9cab50b24b9f6143570a05205ed70edba4eb154e7c688962806803bc908c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96aea624a93c3739e78afeb6bf8df5ad977cacd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130d2bf9a9df29dd35d9957a95fac845e636a8d656c708d422363d494e35540b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e331d3bfdbfb331cde1b9799063004a9ed8afcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d219b6bb6a00286699d3fe39bdca683e7a19351101a23bd98ea6a306c3916d9c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ebe12ad604d350eea32b89094822f58dbc58c0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852636ce55c963d6212760010f95ba089f4f5915c44c125825b632c0de31999b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d8799ec92debee203cfec7f99ced983babcad24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd00501cc67e594e89b34e0b38395845a9624725c0d7caeb47fa1385a0940fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e5f0bd13edda0febd08fbd410a186f767d56b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffb12a5f828c7b99533742d68182f5c10f456bdd55e014e38801d454ab3b252 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..402d799c21198d18d93d91ae97b631f37d2ae65e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be93654f2e86ee0f52b8fa34d29ed48b3e50cb0acc7f67106adb9c7bd8a1f932 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..757472689e13994c6c85e83f820a7b778cf14b50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8517036dd02ee271fa2696b33288b7152a5891145e92f62d15e78b3c9cf13504 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30546cada2881639353948955c8e5c269d11068d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21644ae274839c2ebd4aba1d7dec9f1102e14af5355bd92d48e80422e5eb61c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9263703cbf5c4f4f44125aeda23e3011042ca5e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c6dd44d835c7e0df9315d976866ef27b4ed9face3d0779424e83e327977ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e96656c855c16fdb3a920d63d52b21e743186b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ded6fe2338a3f073fc7ee24305d14c9f642fd14d6e88306410c9f5f16d2330d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..286fae7129643a809cb1a8734206e7bd781f0235 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9008f17790a118277af1715f9ba29b549decb650c49c5cdf8d26460bd404da1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..406f40ff83f89fc9bd73341a16c64824306e1894 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ceb7e6383d58f954757af97ff990f364fa42166c7d4ef1878dcfd362bcf008 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a99fa0dbda8b059f28eafe8d9d81d218c790c42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a416a20b6d1883256336bf837e33c1690be2f933aad62ab88e67787c7b581b57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66110bffdef03f3401e841f7c75c8f59d1fefe21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5448fe925b91dc30c0745584afb0952ee9eb7d6c2dccbeba0c3a5b52e82de576 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..346a49b28abbc50400c35cab758219782f62efda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11bfa1e0331f910f2d1a812abb47993d6d162c36029bce91df808557f4f7d90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c66203b608cbe0be053fd07ab39d6a2ecd40aa2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf6920c5e846a47bba2d5888fbd2a4ff331e8590fa67091ada144eed6a7fede +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be2868e6f87cb33cc82d0b53640179a86dd0133d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d58451fcfaccded3beacc4df42f8bbda60b77a9a58db45464675bcb6fd66fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d321d6a061c4bc11a6f339d9e49198f449c6d0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2da892fd4694d3c06b62d45ed99f8e096afd07913f8c0f274927f2da41dc9705 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c755291e60e3330d71a3ee91a1bde3d49dd3a13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13533cc8eab2840b3221497e4a6262090e18546de0d84f47c1c89a6dbecdda0a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9bda3f156b5132de0c32a78fcfe7cdef2e881b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf52fe1a7ff93d19fb17f53ce59fe3440deff96a91941724d7c08205f33a55a7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e99b11abc40066012b70770314b15f7bd73cbc1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f1b83417f90a106bca4dab8647535aa35cf841429a62225587d70376a9b2d3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60d047b38689514111cf8e57d84d9f3f3f76d58c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebb06adb976c2264bebfe83192d4ca973ff470e99b62103ff4a7c907775f96f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b868daa12367280bc21b4636661170d7a54ef15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766c67ae5665b2622c43e327b9070713386b6fb9e6d350dea455eae45e5c4075 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3073ea10a75db7ee571fd2e05779c7f64d504ed0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292fc16bcf2cb4422e6045453f5624a40a3ce72d43f40392f4a4d6f5da1f43b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17400f8cce2b520e7c75b728d05317dbc1859cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a13fca86c0eb777077fef379611c21a4900f045b54ee98e819f2724cf810dfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1426790ac2a86b796801cae64561d1de655887b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971665324b4668b031d86cd0cff5c82846433a21c155fb902aa6bb5b2597b105 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f58648aa1f48439ff1f9161ffa6cd07cd0bdf63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb2cdbd6ed17971eeb036f7198ebf7ef8e540f6697306d8fd5c13f3945c8c14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3cd456ca52e3eaa997d50094ef680db85e6bae1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116402d50184002b82cd5ff86de43cf920f7b4136b0adf68276e1545421e5ee4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64ee803d9b937d314d222c1eb27bbc007c44fa2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90cb37584792ddb132634ec24464090595f559ce3d6e0b2b7ea87d30eb6c81e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a673af0b18e0cd17c6944a0fd05e5a781b1676dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ca339ada8c91aeba6504f17cff72f5acf023c354b1450456004b17003fce03 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca29c0b951a76ab48a3a429efd01e0667933d21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8274884f48bb490b132bb0f2f6ecde382b1372fb8257dcf0a5beb967b319ac6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e41cd68364d5132be0ae1dcbd5b06bd3d6bcecd1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ea9733208633484302698c981070f5464d641513ac67b1b4204499f5ebe2ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d0ee14a3460cb003ad781f4d7b207af26e90ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fe286264229abbc9745aebc3d1579117467d38e8b6f514408307c3a639de59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38d681a601428666a420251d96385cfff08267d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0280d5acad94bb896beb4b74a149d0942f698ec07f4f58db5987e2e8d448d35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac8a5795ad7c5548b300577ed838cb7ea7d2a4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436c3c1d5e59d056c815b836bfdb1e7a5ae73a4ab2f7f26cc61d90727bd8ec31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ab0a0683669183c8876296933098218e9bc806 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10992dea65cfe6824fb055b82cf81f4ca68ad13b1aa6d5efa1561a5f883a8d10 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..599dd4970b51acd822da5b8a0a1945ba83ea72a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08cde14d609bb7506ee9512a0533254f43e7182361d9a0346a756db928117594 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad068bbf2e5852e4f2e11292c2ab55c7d21b0f85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f374910e7280d2838ac74fd3e6ace7a728e24159f84b43277ae7fa0b499831 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18518f171b9f57039525e64daaeeafd37f444b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5109a44e77d15b47c17be8bd15e937594799392a19e304a6d8a381e0006a75bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5d2b4cfe4699ebf480748be0adc03a2d60b9fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbee1ca985e9390306e7fefb50365ac38708483cba7b92810603c46557573243 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33dfc5aa42638f24fa44631365f754b73bc36dac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a822a44a37cd2d62d4d8fbb0262e793145e7cfde592c81eff450cbbd6b9ff816 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d73131cbc125b5f774b893f82aba4c278bd2e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b19eaa01ef3eee8a70c6952bb6eaa6ed12a6fd4355aee06a6ab22c9092d687 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..262efea184c513717ae323a07016704db7a43077 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7820d5b4edcbda5eba43c413dac97736a2f0fd1abae64743ddb9b8d86e63938e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c641e5e6c6c79296dff7688d619dbad9d7de44a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca837f28eb1435773a06bb81c8fbd2e2cc88588036b38c57d8669c9fbdc54a4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5da9e37d08519a4731cd5eb6605126055dff4a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c066fe09fe2f95e94abd6799fec7e1a6420910fa235676c924125ef7b003fe58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0cd2762e36e9752c0e66c555ed863b6d6543b81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb2b19d9b2cb7b1f97bfe89e5ee67730b1cf9eb75166f3d7acd435d561abe4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe518bc5ed153c1aebc750e028bb54fbd7460a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820c311eef9c8f195f82e0afcb702aa6331467a0721b0ca6e532cc27b3982e0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f1ac808a1663fbf89fd63564a1bab589ec16a1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b005fda593d55e160b8b4486c533b2c5066ab828e22fc3c8f33c4045c92b1187 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7271c48132512e659c72e1aef5310443d09901e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5d2fefa6cccce986294a7833c023df7c2d6768f1c481b6c9b70d78fe6942e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f72e61a0701bb55a823fca63fa3f068ff19fafde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16b43090d374fd63907d76dd4038bb971171d72d0b3a9de2418d63bb1a2882f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..938d88db3c6179f099bd74235cec1433597aa68c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3975b916c4defed5cb8167437ab4505d369233ef6615416f1f5f020e62b19577 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2109d951eea6339274b113853e05ffa70fdb372 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c3efbf5ba8c9efea5dd085567aa65adfadb0d0f05f02e17220f8372955e97f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40139d22d9c2079a01a683824570d89a94f8c6c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9683b3e7adcf1a15ecf5e5c533587f79807421110fcdad1fb2139b1403bca363 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc7cc9c9f77a8cb726201ebbea28d63bd3b7637 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76618176aeaeb558ae1feefe894ee5473b486448abd12934a9cc49a6f29a8c7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c54a8eb16ef09222f7756a53e09ac02bab12780 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb317748e5df83ba493d8450e92b2e60ebb52bd6d32eba1dd1ec2568c7ac3b0f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68855e9c8e9a0c69471d6eb62583a03677614f5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73451982912fc8e0b480826585ac0f8a0e12c1064221e4f249f162928fc325e2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dabaf012144ee8f2b8965c63fc9ed02dd1520cfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff92592de249756100e55fd7996af88f6e973816b7d9dad44a1ef1281e1e03e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4464ed86f76d6e3d152658bfc4834af665d9ae7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1826ab8e3ce8fdbb6a29b80a6159b19ceaad242076e304e8c2718a48ebc0b6a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..194b1f7be8b6919f163b3635c9851499b3d2814b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ab7a3ea1ae12054afd29fb10219ea0be87f853f8a34bd99479b09dba71f8bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f414171ae94ea822a53bab6854d2da7e2eabd4b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b4aa4cd872f35d5c0cf4b60d809205a136b2cc331e137a5b39c3edd9a05e7fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec30b718c8f5fd554f216f7afa64ad0853c31bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f81e132277624a62793d5a6f0287d6aa77aab13cd7b459a4e0178a675aba8b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4656976278f286fd97e7a70daf6665a92bd3a7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c7472dcc8dce82b91ac320f5cee0d229853fb52f1a5e09223420f06c1b38ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53ff4fb089b73ba521a5342b86ad1f1bbbe76de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b3e0d1b3c27f186c563000d9adbdfa79029118b3effa36aa8c76aceb88a552 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99993a45bb0b265c4fd399b938ff87abcfdec207 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b83b6f6412da7b4cd8e8c9e8e8a899b55699cd4c3c366aef3e6f839285211a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08569dbe9ccf97679d90b568e901d73bf1fc0d0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8a106153b89db71e423743797b6f4c52c45d255f1177235f31fee55a31c7411 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09fc23056d261086d94ca3d3d08867b269788a80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0184484072dc8af9eceffcfb667d86a73077aa96f3e79ffcc9f5557f99ed141 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..615181c2ab26f063e592e707e1588267311ff81a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc87e9778c8c72b0dc4d9199c82050056310b0fd1768f70fb1a9ede20e43b16 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f1399ca81867ce1150151c8e92d39eb2b019a7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47756669b4d3db7498c57353cb670722422ec9426a6898c0ae7168313908751c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab8fa5b80c7318641c6240871b56dbe538f98ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a623fe73be11df974cc858dcc39f007af9ff1056099e2a2f859e8cc829a56a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa5e364463c1907549cf5caa63e1cbcf224c37d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:768cd7f567f6a3b482e6c5878b9b889923c1be1540efcfa2db47089111913cec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18988a230ad480bc87386685870b0f7c10fc155 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee1788d52000c44141a585d279cd7c0331d3f84d8c07ca364bd6ca9ae4d42c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8da114551c4f9c7cdbda1b360e1bc950d9fabc7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1fbd83baaa4e5d0b50213acb303d7d93a6a8b63523a8986e3eb5b50f9f0b85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccddd963450ae387d76c61b4272707a495cffc86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767789e810f7b34995d3461f92ba36f900696e90f79f2426c9335207eddcc3d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc43f77b61bf0b2b861cc9ca5751e85548e3e7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:000bb9611673820f50fb3c9b6daf4fedb032ae893277afdbfd6f2765f1b641fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..635c8af4a559a351bfc10367f4a54103741b0223 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5599bbd30703422d8179e95c59187abcc3f4c0548726b220a5945a8d2253dae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..744acc99fe611699ac212cd2e2de0eb29bce173d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf6f0d64b085cda4a00d1ec65479c2b9f5301f3a050bc2bec7d586f6897814b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e93779060dd85ab8b90b496438b0514a591f33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4267f58e0db3306042340c6d62b4c8edfb18f5ce429c8cc04e3d5e2b5560287c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f079c81f82154f4c013ceed79806285ed7b77e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee5a5c965ea29e7c81703a2c318933e74a411c82d995c404d302c23767aefe2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb3aa845a9a177cae00688a84808c27de90c6fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323b1d9c14b5dd1cb0dde9200d04fface720dda50f1c791786f6d2369cc1a798 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..192f385266c18ed3c2be283cff983b33b2e391e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239c33cc85c9597f301060095140a5ad86f70e0f91e8fe76368e78b3e4beb6cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cca806c6e2d323efadb9ebf7cbe28c7c7cd393a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f79963f7285ca8d62ad196f895fd0660ce9cb3b150294001148e6c8ccd8c7f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d1f8304cd54bc9ce20071e363e84a645494d9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e212093610f2f63aff98bea878e745d38201fdc8a985dba7f4e9847e1f6313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb863e68dff6f24185eda526fb605523fc34611 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142e3643b8aeef36f9cc3ecdc7e89627d9d6a06028071cd30fe216e6ca88037a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43888e73356281c984ae861dfccd7adb7350d43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8908c2b029612f96478883753d696ee74cf8b40567a64637037a04a4070337e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d51e4f9e549238c690343aa20892a4a6d4e38131 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0a3c6ab7f9b1911cef1950564ff95f4464b0c8f797631bbcf505f08771f335 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84e56017b5179d0b3c2e857f277fd4ce2f0f1cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ce4ab3fb6713e4256d28cf98da98d8ee8deac46a7baacc2239cc05094f306e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..633a3bfdba11f6d2b6981df43d4d4349e6da1579 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225a8d8842dbfadd90708be4bbbfb81a07ddbff381bc71b751efafa478d0a468 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e47ed03c41277af8081cd2f94192ff637697d05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b5c6f3d77a3ca95a1c64b05bc91df278518bc2e34ef2d0ac16206b51a8a6de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf4caac25b096c4a412ec7323e2c5e0ed1601922 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29e7a295c15fcbc0b07d73a5e629e3bceaf1280a073a94708d8f526cba61692 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2adc165f27421edf7d1c825bb917f39d35a0c25a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d9b86d9c678825c8f9fa85bd0cc0ab12e7ddbd4c2be7555db7444fd7147367 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef747823cf119961aee06d3c7ef2d6fe836206e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4d97406010ba5fc8be94ed3989f9c41f8722a771021ffea1ed9757595d2fb69 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9bb58e4b7d797257dcee5573bab8b69e6c33114 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721496e275e6e6f5ec7cbb9dfaecd5d05a6c9077f926464f34df1b9265413870 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a947016c6ba61e38e2457127c996d43210a980 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ebcc806d8153d3581d507729a179a0a4e78d99b043277f750a90237a64f72b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70234e3803cccfcc8040632e70025b410a3c478f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93dc1a56ed5d479a39e04929520e47db94fb53a46d9a370082687c03cd92ab4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fa2f4c71b6ee69a142690684c14d3c0bcfeaf9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68656574f6d78314cd68a83181e71bd37e5bddeaa90ab511fc88daa350783d28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24abdbeb571f8c489eccdd8b77dccb74d2d944e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673bb6889cff209fe1a43ba71ccc7b361b4228f9a33a3f58a4a0909a953cf06e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3d04b1f626f2b4027248a11bcc419286b0432b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653b2aa2eb83947b2a082ce7d00f16d5aa0acde447449e5dbda25f570f6fb315 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b7837e62701efa14a3323ea958edfeb2ef4320 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a706973f2e1017d24715ff0305a988ed983d4f60ab43b28253580a11562a4701 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..880578dada54042b7f8f475ccd09719119c3ae8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce72c574a6c30bed805c0e1107f47c2b2f1745a397e41aa664dc399abe1eee07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d64c602468ddceb0d64a5a308eb282699db04e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4997cf92d7b915c2813458ec5165fa0478929f2c741a14ee6bb643fde8eef6de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32526381b31fe3d8b35b138159764b1c6115b0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec69114a5766c6412ff2b53612b554095fa22c4039db64ba3e48488aab44631 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..845cbbc6243e0508bf8872aff9369afd61e5939e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40ece0d8950cd47daf5ee77cfd1dfa36d6278e4572cb4eea6b0de8f7df0f3e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3718cf1f5bca564812517ebda6fdf6cefc94902 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a408e320b5535223fa785458f5140fd6d89e7c45061e7054cfd5f274de03913 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3c75cfd2b0cf880153fa71633e2011b07e0fda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a1ac46503be8a36bd4e8ae1b5513b8ec2fd9ce034ec540d11490abfb6bdd98 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cbef66757615ab2661f5b9cd1ba21609cbcbfc7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db23afa55353f8e9706239768c9f43e5192532115ee833e922b2472514e83559 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b5089ff2d81d3699031e0d7ff9892bc66b7766e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a25cc3c6982c0c936c6fd27086810451b17369f1797e5e345775c9d8ed462599 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa4f5e7369043655853ff2696fed159be4366d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2db2890678538b1cf1aed77df58e796f3e0dfd830994e02f5910e57a647f822 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4588cb7d755f0f44e8a470e3eb7deb91b1295b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd6955dc23397b931776766a84008b42c470506fbaaa1eb06cd7e272c901f49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..013bc9799a47e72ecc744a247da2c6179d8ccd89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84111a0c9f05720d921bf05368562b66b26af29e2e0b8b7bfa36faa7766f8be0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dbcfcf9473d30193d58e49162fa9c71dea37ce8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330baf9bf2a2254e51af8af666f110c6754eb53e3123344088be829809515267 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4844789c96133a3f41c369849def1b32ec21550a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377e7257b5584bde9cd52f0c29c3b1ffb930a8221763734c7b125d989ac1de90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..100d1dfd5d01f9cf9876c53c94b2d77f22669f52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8c286236bbfd554a9c1fb5e9d0f1288e9213b8855e313107f2d188affe8bba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d52b9bb8450c2ba76484cf64cf7439640fe1cf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df811bad5d4fb366e8b0636f7b243d81d32abefe138031e26818f1bcc7788752 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb21ae78a544bd9bf04c763738e98ed628e79856 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca846906bb218f9f1308a5304f2981719d415139fc29acd7c70d0a77e0927c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63161bbb58cecf860e87891b396a9f0166fa8efd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f148ca0e438eeecbc9f8af96c716c7975b223a8f932fe966b8c0131e90e8d68c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94aada33df3b3951406bed4e1ca8155ffcfadfc6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c9f776a9a6c442eb393ce6b20a13b612836532d357b66646468b2f1e4b8866 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d828f735dcbc6690cdf7d67acb3c0aaf01c9df3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32157fb33c64e339bf2e945fd58145ecd89687e78b7926d3d6d3e8acb3100da7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..086506aca2d2375627dc465b679cb4a31b153b25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e6695b8dcb1fb13d079b8051939622cde14561269b0c33c2ab220b18d6fe5f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefb02f56914882c227a7145d65342dfc1a2413f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a13313dd4d6bfa81196b0d3308de01e80546e0dd6487abdc36a7784a9fb553c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de263673119d9143b47221e9904ce2f590764daa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b564826de37bbefecc445ed91d812735451fc86b525f1d4340f85487811e4cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9842d2664b0f85aed5aaf20b4e9f3730259a045 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc596e5173dc76a05570b3cc8f597f4d4b22da88b52aae6da7ee8ded6869c02d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8bbbc3cdd7286a2488572c62dd81bcdb6ac96f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88551f81be3f0e7f3c5a5df188d72eb06511f79440f9bed14ec0e1e0cd5299e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3a323166ef6fc57c98bca2e70f3895bd275eef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c1df077f3a76b19a6de0e913ae269a1721b30b5ee5f2f79bdf12d09e1112be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b5f18c4fa1b17e07887f98ed01c921428ba1331 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ddca04675909e00758f35386999d330885e6f4aaa57a02df5dcd856319c862 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd10aa4f9518439dff188c637effb2f68bc7c41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad8f63984abd659536b00cdbcf4b36cfab00852a56fadc0477f41034117161f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..225cd9246a009b1e0b550831a3edf1b35e4df0c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e68d7754e35fd38e4f2f2f61f72c7ca08af830ab2cbbce68194b8f61f19935 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a664a36b209f602e1fe0666d7951f7f7103214cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b55cbf96a9254176a294d3002b0846cee6e49f9d979bedf0279970c7ba072c0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef6d36efc19721f623aabac31aa03e8fe699c20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7ff1266ae865dea21e5901ec981f13f9b01a7743d1ff080e6c8ec3fab10bfe +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3926250abae22c4523b9e52a92a5ed5d0e60f4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2e1a6417c2d5dbd4acdf11e6586c1cd1ed1b070a02dfb0a140281beb648a75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..506f26ae894df7f8ad857ef55962e41d3f101d62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c0f22fe797d9e013e53f5afaa20538405bac65fa67edc53eab459ff3f9417f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..420deb3b1d438de89d4db8dad867f4b6c50276fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad97a1a6194f6c212e01a25d9d464b6852085364670f03c402a488c16ec31f83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b70f2f4ddf55bb7f3661fb589958115443afca6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2957ee4dc643a671fa1545353f7f9f19d237379bc1c5df3ff4a589ce78818d6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc6c334245a377f3b3b39a592863c4dd95481eb5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14533193321d8394f98786508476d5854f3968c66d470136a1482219129e493d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e474c44832ac704fae1a3495b15ab1ed897460d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ca9233b401a4c57836153de473b045dc09df78366915372ec5f105b71e72f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1696f5863d6c0dc5b1d0735418727de0b111367b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe804736fa3aa4d3d3835f8387dd67180816be3dec4a1d9e32d15bc1322008fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e4578360c83e0e9a00046f128903104dd6813c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c5935d6ae1d06ea63413761f07c0c840ca08a38c1fe73e6b68020a2ea271ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c021fadad601a54549143c5eaaeb3dbe634ae11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90603d80983fad3b1a5434798dccb30349939b057c35bc00e58f8b4d1755e2a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f868c7053a9f9309897fe56badcca32b4e6a58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ca57acbf630fb200f9bd76f37922ffaaa74ebd5877310f5718123795909de5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdff72e7132d80923f1a3aa27678b5ad1e1d71dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c93791f16301af347bf5107b90cd032921cd817e98054b8b7ac5f2dae453e59 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e6efb006d992598444a3b9b9ebde8540fadb5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee13c72a13f699845ee47b6c56984d3ca27f362ed7141bda4f703d985b9c32a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc49fbedd517591a6d56fee5e1ae9ff504faee51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f237413dec67cbba75923ea2fbef446846ae322e3e7c3bc87074916018cff8fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df06343b2923cfc0bcf2f7a453e4de6cfe3fade --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f01c92b4a4eb16bfc80972b8cbd3cd8d3ab417851d7ed0294ce2376b45bfa79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a85c3b2c979892bbc8b4681791a1bce2999803 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c0eb868ca9d488787ed5eb61a72e200bc7c9ff852742efecb3cf533877a6f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d28bb8153743e998c7baa021c9fb9fdf2082f99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6b4bdbffe3c406ad5a9432e82d0b344a07f77b2c579799fde0bf2807cc282a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8dda76017e80f7d465d77ffd0930cac178b239 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f977e0f8d57f9277adea586e44b3641456f3dc7351b806c904aa5a173760f3b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e07fd2018d8ef0114a207713d2adfee6e7e0e24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f0dbb1401ef81026205afaf3c4a4cdc06bd4e6720dbee7198d78d46da4b640 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c933956889828226d34f32f3e0bf4cf2d452537 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458c64bd69693313821c3b3aa531c779939457277f5c80d3c9df805974d94f01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68a46745e49c7d151ac64f7d45504bb7f3697da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c9435fae6296becf12a08f65c2a3c836f88dac030470681e6bcd04176594a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e7be14c9236e1df265c4f77f6cdd3dd43aa2e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6850ad76b5816c9e5e970a700aa0802114f78f87001bbeef03c55a3febfcf6c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c53fa3519a15a68f4e8a1a55c18b2e48cb8f6bdb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f47b23597ae322ba7ae12bb363425a16b81444f0b94afac2e1ecab3ed14d2c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d5948c38fc5695534cd57c87ffc7ed0b437edb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920a0b6606ad1f9bf54321e362f4ffbea3aa8f31d18436c74f2dc098d35b36cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7610ba6ff8c6c9aa1889a12d817ede56fbd10a15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:245406d9b5d247090d82cfce7d9a7f2923a5f03c7a2fe83cafe3d244b1e67565 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e892a35af5a59bc27bf13289f01c395943da557 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3345726681b99c53d5fd981750f4a3b55ede57e89df46ae55a1e12d3d6949652 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d04dbd1b05987aaa807f4c84b9a65b6f2fd23a9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c191ef4914453cf4125a1f4b42baef937eea83dc0874316fe5fc71becb95ca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ee08206aed34bcf4e839370df96abf0d7c1d59c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711a9d9d18dff3c3edffb31d22cc4f929d38126a78cbfb05f8cf12798eba0ca8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e0795a6aa56a7f29271dbef607fd68e30a2472f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb155408d61f0030188123c3fbb080d57c9f7428c25d80ad68ae89170baba9bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc429b89dd801bbfbcb2794e80db7b9482e4dcd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c992f9a05909c5835769b331d8721f24b1854c097c06d85390d2e26eeae13613 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba20028c802bf3d587a4c5333aabd16456319323 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:debb1a8446a69eac90b4ea7605a7a493b46a7fb752784ef1b8de6a1d086524e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18169c04f4a61730cffbf3f02c1b5944a3671c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cae27361cbb5e456f67aa2d55ae867a9ba6e5158b2c3edf030e412d6e572e01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d690bf97af4bd1c1760cf90cb165fd1fc5163f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6468aa0dccfde55b3bbb0b3815cb5523d7a79ad12371f7ede0ca23367c623447 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b7a7c9acda5f7ad3fe8394f98876b98aa1dc4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b582e9819b489ace7b33d3b7046bff2adbb2aa43e32cb5cd54932366ebb928a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad700a635829007d3995811b1bb6924745e18c5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50481305cc230e2bd5459bf64e2b61d83b7e6b6cde84b0eb97c5908309e08339 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92cc205f0443231ca77d96bee84cadf166b88fad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1be99025a3fd66cd0586ca2e3ce57b5edfb6157c56db1f6e4ff092b89a1c50 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f04802ddf1418843212294eed02f303d0e5039 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc3f292d587ac18dc0879c799db5e3f8f9955790caa47a147b83b1b730d6d18c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b269df2313dbf411b470cb56ee11b7ab3f50f750 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0d06b741ce575526ff736b4fb763e3c363d0d71a8f0b313f398621033e4984 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff91d6e01290cd92f2556c607b5c3e82e974640 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560a45f9a81231c85ab97b1538e97aa5bbda8dc7f1cbcbf7c04ac53cbd24244f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd6cf2dbc5809cef0545daaa4a20317664300ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5396879d1c1f3d20dd21ee8655ba8689730a2c1f01d182573a979c1cdff5f876 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2fbef2ee1e8f03707c298745f98bc02ae808f46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e84452996cd38cabfe908dbf9ea11d7390066876c7ea3443c76c307a4c0e09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f56638d4c33b2223923d35e91b9d17f972b4c64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c407d90a16a009b4dd7b75992c105a9589c9e9c3dec4a5c15ac161a029813e73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ae57150056b565d76d1e9d74972df8bdcc57e73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896315115fe63bc3c67b6626d16650a3b5a407d878fd22e617bd325874c62d55 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f83cb131a4ec12427c57f27c589a8a305557de9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db43a7f0ea3119ec3e51b18cb8fb268a1f69b68110592481ee4ccb3676c4f8bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e780558a5b80dbb13202c37b0834fc8b11f16a36 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83e47d3d8c3f921e09f0495f068eef0ba8424708c8a2a66bd220b08dc8000aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f5bcda8aa2f92cc63b849539acbdafa84ab9e2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef82bd13194fa45b1d47f0468ae9f3f76ace0a3d54694b7fbe35386dad0d73e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab67074984458f952bb48fe5d683fd57f6c6118c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3de4b1d41d254f13e6d04fc6a0e0f575d9cbd4545adfcac822330cb054d986a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cea9ce8143f494c72fc5a786280cb61964440a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855e2c273bf3a5dadb7b3fc55fd69bc3bc004c3cdcc9980cbfaec910493ea1de +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f147287e4a6c988c92ba65108cc5d7fdc34832c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab5cb399ce2ad5f2c045640a3887fd3b645a89a383fb3f736145d0465ab614b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24757cd762f4f2c15da7b7ffd0fea99f663719fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d5807615c5d936c5ea46a6c1b9ed5af45381006ecee0c82137c9b7569da264 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..876e3f5e2377540bcd4e65a4bb149b736dcea964 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614c872a477b3989a5d0b8d2536ad4a9100fe7db40211851c2cd61be2f28bdda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..276450967b35f8d3263412a1e5c8e0c66ed9dc5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39e460cc123516ea3fd6fc95816d365d6e83f4021a3bdea3809faf0b8f1b0d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2e661ac3a07ff936d8862de9722fc407f47039 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6507b6d7d8b4f44fc31ef037b258cf58074e6f555b9378ab1a10f817c590d9a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d0d1fcbe35bc8fb423c37f4bd26a7b727ab730 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d97e34d2cedd32d353e22475450d8ad8a94ae43eca2dcc01a46dc205f9238f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f0071093ea4a8649258a791d34ec4b1ae86b66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be494773c6596a2940b8086422aea21f3aecfde74aeff63ef17df362fe75581 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f411311fbf534783e794d8482d672f283b31a6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ce9873939955e43f32c0a6fd78b59a7bb575be620664bffa0fed87ed66692d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97c0e4abc77993f1b87b49bdfccd822dc305af8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c306604d798a83b36a34976b6afafb3d8b176c4707b43e16bae484517678e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16838f6cdd4b26f4810387bfaec1075627a5e485 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2beaeba06e33318dd521352da0f792b0ea8bf4134862c8611adeb6cc87ef358f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7ceb25c8ddca3c7cff4ee830078d194f91b66d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2178ba45ce6890157c963fe5e8f5fc15958d237695e3cc9719d062a67dd50e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef7c0db221f306159f5212ed4b5ba44ebd57f1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e3c461178ad7bbacddad0dc7026bdc3bdbd7a8815154136a1a4338ab98c3c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9816664f5c2ea2bd3429d83140f285237bfeb6d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1692ef3d397bc757ed3bd6d65646a5756b2094e97660de8cfb5702575163dd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2493104257e9af41aac11eadbf69e56fd6fb8a3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b52a389f69f03e495f9eb7aae0688c6ab9f3ccf9ac29d01631d1a776f7028a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17d3d71389d018c8916b35531d0732e19498b69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45432603731237a5cd6fe123ec42b37ac31f048ef7097e0df8ff5577bdaa2ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1888721e02a4a6473989dde22970b7dae156a35d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51df046e2d16b2171cf944ef04ec276fd671f4d03b74b3545102082e5e20fc8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a6c74b5461f40024c96a411d3a2acc0bc25b3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574adf7a7e7cfee52f462c96137dd3c5c3361d9fd57c96b7eee7729c837cca72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c092f6906c573a3166e7c1e9e70e770d95aabbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cb1c5cf0691affaf94faf8b6f664da7c1d8880e6c343073678ccb60e64a3cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1759451e43f8d59a1d909041807c0a626a0b620 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e55cefdd1830cda5a9f1d784eebfff6bf92e068c69b01f63886b4c14721b1b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce32c11e0f5a96dc50da36f6868119bdb6834f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f612559ea96a34f6203737ab400879d2b2350638e1f9cd75fdda84b598200b6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed3ce2b23d947e48c5f3919a6606815ddd0d3be9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d684a888fbad868397e8241b1abbe243ebf90c154025addc4e23f1aba1770e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c89b23ecd26b4ee236cbc3894889498b8f9ae5a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54386935add1511bdd88a9c34ea6584e21bc67b275cc1f56f6c9ee3252d798fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0b14a15e01376c4a784ed2fa10e26e5486cee5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c803c2eb925318dfbc993710be62b3b3c820aef0574081863e866ecd7b46c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aa46b011c27b1611ccf4c6d19f9158f0c6ccc35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df803b839cfc000a7e36dfb972cf2cb6a2cf7f4c6f68b4e193cb6d15e543aee +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5b57a99130424186cc9cdd949187bd731f0108 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9488af3af72e7de2d7efd22e822f3bf38084769ea68311bdab465fb85eea4ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcdc5103b4aad739f6d75c74f774f49b60750e29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fe25a32c5c4b67040a9ce245915b574c2822c2f1328e11496733c0c0891a02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe87473e099b95c32363a9a2ae3a1abc3d1b6c5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a5b92e3da105b88e018e2ff1e18887b93867d655c056f775d860fae2329e91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4a24706c369c03048edc1512c83a0d3b2f0cf2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718263ca205e3cce6abc34a790da8cbb4a75ceb9b830de5baec4e19809aca817 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29266f8dc6873497762add71edadcbaec939efeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b97fac6bb732d36e79a139e173a7a7cb2de2337832e12935454aa294cfe4be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eca6da09a8ddfbc33efa12f9624271aaa9e690b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce8903969f748ec0292ec5b1ffe618cb890f5847be8e2573757b6c878262f78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82423fe18ed0f6e84e5b3cf866c0bbce19e70ce6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a549cf7b61c59ea24f7746709d62c7672e5ccdc7f3c4443cb88e2ceb514348f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e94965140a8dc4643d9d38182c5731b058b606 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb717d0b6f4cc3ae49c30009fdf18106af9875a6c548326728391bdf4dd148ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..697b90bfa02fa529e46180b7c3af63c3aee2a26d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2055ac015de8efd871a726f538a9994fc93fcdd2bb1ff68cb0dea7517120b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a78f1fcf8004284312ed4a1d20077bc43aa8c16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8692763fcccb635173158880b6d38bfbfaccdb457695e9682818ca4b90e2a717 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1010e24d5fc57a5be5fc9b897e9f8e6ac0d9080 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c549e1546984f59980fd9c0d4e59c78bcf15174a6505ad6577e703c724eb2d1a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41dccfc78615e8bbc0d2c81f8732c8eb22efaf72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a769388c086c755fb9864d477611fa1882e2853759f5d86267c8bd3da5c8f6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e93cc2014f1add4e41c6cd08050d85343ec020f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8791a3f61381761dc76cf030399bb9193549f96b1624bfe302c0d555e0dca9c1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ed8b1c599aa73cd861e79b16f023af45379224 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35030d76e9ec5fccd15b80405e4c8cdc5b892265856e79c2e23ef2c04266de18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0299573c0bd5cd2682e75c16e981c9d1ed5b3e3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06bef771831ec6563faef9f6fc4a2494fde757e97a1ea9b6ea51653b14387b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5133552e68d411c6e8e988d059418fdec9099db6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3325f2855ddf57a45a5878b96df70d289c9f0564f1fc7429dfffcdc3c46de458 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2b9a6aecd769ab36903d65f738b4499d86515d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693025752d02940aac5ba30fdc3797b001b25e7809db8bac8dd9461ac2556c36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71eff8b110b07487619f98a79c96c6ff0c3dd5ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada7403017efe3eb8a3ad82e0f7fb8a99d1bd6a4091bbed8675a726532aa188c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..931fdb2b51e4efb96fb744397e4ad459d30538b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb0f46ea3583a4f8547ca3b3ad18f66800747350c3484849ebd40737e45f1e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbcbb12fee959d134408965a31b17ed2dec4729 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f410bb8a1c2299bd3f25c66ef4bff02d1c01837c16e0dedf037f5f6cee07be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..121f2a2c97c2639204c9004e7bbf5ef045d207c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3eea77533555fed9a502394521835d18931127fa601af530c8f937fd73be48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6e58ac4c8cf91be627d01236299e4818ecd099c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bab5be9ae6e0885455d829286c5a9e2ff48831f34687d8b8ca5e5b22e4e99ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db24bab76dd6d6febccf416def6d4adf4a0b6c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9927856bcbcd7dee4c26fadd4f0d9cea0e116a15a96e5cc8249e1f1a3892a858 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5a89bfa486e614712741438f027efc2d139a05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d889a6f72726453a60c8c0f0ed52b971eb0517fed1b71f11a938a7b7c7cdb97d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69b0072758b78a617adbdc04fb91dacfb4969cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35815d5be1da09082232a0065e4ac55e7a1a5f0c08a39f33932184d050347ec0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b4003fc3d7e56866c7e43664ff62f6487eb1cb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520e84c7a87ceff0877d281148a7b84e480c1dc8a80f036c4e8473aad00e17f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18a1250068e96cae41eade4bb09365fc6e578e79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746b7a433c6005f48973c105c877bcb8dbd2366f0d38551c080ebad449854bf5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b5039a0a0cae29db4e46d2b0e9ae4ae3ca9f433 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea938791d30e68f20b363fddf549dc15dbb9203f58b8ac2f54a506689c620202 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a30bc31e9b3272e97891dd675986af9fa9363ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce6054f3cb0ee984d05a0765d3cf32721842253ca690e714de4ba09e7d0cd67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad4caf42fc83f6d9c0f9c6a6daacd6fbe17297ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93dd82b4c43228a6b75743328bd6bf82b18911a350c99c4b23069f34fae1b2ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de4c932c9dc8d48a7411e9c89a626be62ca11884 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc56bcec9a39053a837e72b8573e93483a1dd11270ac213e61fe71bb5f6818cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a9c22d7c56494d2048532bbb368ccbe44f185b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8034978ac58c02e7f55baecf6a96db088452e1cd0b9b59fd084bd83ca8b5dd44 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97820a71d9a81a5187f3610059f44fdc7950b129 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddcf2ed83ec61b83207aa879f2dd630322eda77afbc5da98a8e06878c624cc93 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a944f5d9016cafd905677574830aaab82ffe5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb7541bfdfbaf69c7fd2d019f451eb81e9252a7f9ef5a33b9820b3c6462b9e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14a591ea655995718e925d74256e1ddbbf727a3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5eadfe481b882aeb2b132164f64d9f99795d440050928da405a6597f3610715 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a061307c936ae0adda192ce8f436c6c4cdb0a393 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5672fdbdafc2f293fe0b26b2fb420f127451cb4adbe15dbf738ed33f453d8c1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60750260b6e4c1b389ffe07c7822730b5dbff9e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3fc652b94fa4b2ae7a2c6e1b01b813c9b825ec05948584cb1ca376a13380f2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a52b9752e5bd7cb353354c0b509172f24dee2f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6e02a79a60625b29690c0f73f2a7698e7fd21b8c8ea7476c8a30d4c91630d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5647a8f913116337876b273f616c3f916763fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0aac66e0b29f653a90d45c11852106789259ef2a2381225805155f0289af48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35b03f85bcbd150c7c593eaef631612b776979af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dc948fde9ab41741f76353d812e4c586d93cb52412a7b5932ff6c21f0bc0bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f12ce36358d14ddc067106ca6f4d86dcc44977 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5814d312e6bc244d3657a531dd54e5b16bb11492258d21b9d817b41d2aeb0dd1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb9b0208dc2345cf46124608ea102d71fec36f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37bb3713f006460146a24e9391b0234b1cb52056fbd652c15d83b7ec4a716549 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8382f3d85c71feb9134409b38f6b79ec0e581852 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfc9e838256d32f31e8693ee2ca527461973a463f0e643f3c8cd6ba8b5974e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85149abe593a3eb2ad8510cabb97448e42516268 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613cb159ef6a5ba8df68c7b1464b3bf468ce244503884c8a3910bfd25222ee6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..deb0488fb12f793085cbdc9b866af91f4f536043 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f3ec0636e94d6aef9868384e6c090ce39f76094ed5c3c1c4608ca959087233 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0271076bfd85fbb05b19592a3a36921398c1d5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce1581df44aa47c8155bb6e598966582dc101bdc58bb020d600d43e74f0cda6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a7a2ae30d65ec5dd6ddf3caa8848b95c194506 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a52a6551f37083c21bb9819044be7e3c3e01de6b3d4f94ab9a49d4d7d29b14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a8d48c4abf8267f73797c4ab5409f3208373c16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa8ebcaa2e9f4de591f9b76ff11e120bbaab8226093fb290382d4c7611f9296 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f70224620849887e4a4ab3d0a4860a5f4ba6809 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5baa7a6336392974de130cc24a87aa613d96ff341bca52f20ce5aabca999160a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed0413a73c168e4cadea83f60602dd8c6e2ce56b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a82f1a82e832b9b59bb78ba51f61d0f6f5465792d504c010869f72c7aef148 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2cd83e83eecb2dfb2b1b132fb6610138ba26f97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbe188313498b48822b6fa41f63f7f73b2cccc869818d1c9d45b52339271a529 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd1c2a73406af209533df684b06c7dee4b44a98d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d32f6f04b68e769ec5d75c6a897ef3887f729578078d0d261344d1d248c40c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..753b408621dac17fc6c63764a176bc3073c57c8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5bb59ac0fb9bda0c557917c8cb811f46d4ce10c42487d34e68ff7edf6b5aac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1400ba438dd6e6d6d0ae3cad082cfb96338ae7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f598883433f2084ca603bd4b6f4629315fef37d5b9d940be268b835b7a0eae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..baff46ce2110423f351638341b11b46a865a76fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148f27c6c6d32c250b261966889ea473b619e6a8a929c23b68df6b249e7cc076 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10520634386b057fa715d79192c269e3e96dcab3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a41cb5f5561dbe7de6fea95752e11536a257464c4a99ccbae4441493e75dc0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2faa40159ae94f8f183615a817815c2ed93d93d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c224a05ef1f6c97fafaecaab174fe7c8d2b1ea33a96dbbc999c8fcf741b45a9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbf48d10fe659b0c1a736bdd3f5fd4bb15ec73dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d724202c9bc6f9d2da52fe475172d70c03ff4219cdcde6172994acf6e62961be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f929a8992442a52e0bc254ac90fca627f3ca76e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ea2b82da89a177ac0a6ad078c55316462319c228a12da737e3f5d13566031d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5263e761fbaec7710b13673299e5c499c4af1608 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99d09bf4946cee41fb39e88113d0313c7684cb647fb1def93b8efd28b343c21 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4c323cb88d084439c30b2618a7d95ec44b6f0e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2887896934e994fa5a3bafaa5e4e2bda3dc6155ef06f57808f2f0338507a960c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5abb5264993c34792a35a21e9604c390b7aa0ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9239e8b30070092bb45504cf145aec09f9608684b530c119af186bd2a78dd731 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1580693125b2a50dffd93f92e030feaa50e5de5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ff1cd654f6b8248d56e0539ee4c2b1d438c16be8e3e8ec3546ae5cd1de603a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f5aa83d84b76de0a37ffd82cc0ab0964f78904 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d221cdad4262deb60aa6d702639cce36b7a9b096509f27d00a02bc081695cbd2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5600f5e43bfe823db8d1e13fced146cd0b51e7e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509419e8675cec22eca213032a7fd27fc5b8f95f96815ca6c82cab7007e503b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84687a5f45a1f4437e9e18fc26e3c433353c2435 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84ac3a3741f63183921d13a1d601df3fd5ed2f5496acac4cf37ec6bb81f2d51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8730439637ad74bd264d4542ff99c4838d0fd4e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa11326f3f8241015cee35eb01ba581c52d041bfefcf93dbd7f3ff628cb2255 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23136c66fa2c3c05eca32806cf6fdaffff9954fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:931306251626c2e58d9c383aea7ce78e2415f3282c9d7677a6be52de4115c62f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebc81168d7a373d63a246f5248f48b10f58ccb4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d583e814126fe7ce8c9969a37e3b8cfb6e37f8675905ec16ab9286bbd13690f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cad2fd39d41c54a1a0369280ba7326bbf8d5a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3ffa50355341e8c467607545d71e4b769d4b9b24e09ebe3db3e28a9d4a94fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06a55fbc67ae84f002618e76b8b590e3464c370f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1467e0efc0a97dad2a1af3d98bdfc5ba0dfb2c001b2f40f4d269265d7da94e6b +size 11395