diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a65d017a805e65c9351ea83b6009544b1119c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc74003721740c83bf8269196dc7ebfd72f615c76ef4468eb7ae117c81fa7b3 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..452769c325e905e675267459e7650ec8d6c7a39a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445e3c2ccaa7c9eb9b994d60f08ba66762c76b740060befa29d32d07e7d11a74 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09416e5643f65ac249870ae274d376b2bf2f7dca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a3504d8957eb96d1d74888112ff8884ee67ef7827f6ab37ff17fb89ba1970b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2cdf9f69d55d399c65b694e9751695c917e59a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823beb67d0e3c07a17b685b13a50bb7f74d87d94160628746fcbcd433f71810d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e0d46654c87ec66ae36b897474ba55238662ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb2553e4a199fc3611bf6feaa64fe0b2a19d67db44a63642ead08ad64a54452e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..009545e9465e3b7d854a6b10493bee0fe3a1ca33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961bd3ae9483797ab9a9b1878ad44a63b7a180b063b0e069f2592e144be5defe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a25b86f525e14ce2fa4227ba674471a88820dda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcabcd15f470003780f590b6377438b6a98b5b8dbc1df1d3e8bd7b8bb0428aeb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74de532b4aa43067fcde69b4d11faaca493ea8fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffc812d9c3608e011be259be7bb7dc9a7a25f00eb0739df5b2382572b7f8a56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60b6fb2fd561b6652082b1a37d748c619e2a86de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19d8a3d266e7000708146c5dbc02c33b067d88d876b5c62280a7e966eefe84a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d29a31587c23c85a51ba027a60d07757e68ae624 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12b9b659398f605e2687fa5c6f396140f1914eb04bfc1f49fa71ca9fd1eec0b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f0c5d91cb9bb7db58247190a03ae873350540a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d5514fb254194968e2f1f5999fdb3fdb03119b06a44e2de7878c36b230f7f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a0984a5ab6f22152b8dbebab08a447a31a3a4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801cff73181d0f9b176ff79693956150867ef81b87d6f0c8182c8b137a0cb5e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..042b715c70afbf599aa21495f48d805d9404e620 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb970f8e1adcc2ec9e4307fccb329ebb328aa3d18e5290c3c17eb4757f6060cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b26bcf3aa942bfaaba987951231ba91da784ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a8b2749dea2a55b8b82047aea14917b5ffb4852e230baefb0fdf8b332a04d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0c20345fc9cc9051d15422509515c35209bb71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c3ce1526b7d822995f40ddc11cdc51ba6007c8ad10876f5db5c742678f096c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4993c5cde989ba9f35d4c46ac51fa5ec220eb2dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d429970c8ad0e1dceb87701c9757a0d27ff962d1880a22f1d1f257246df530c9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51ed9c59a7a4120bb0e9c4ccf96145d573bb0c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6199b1b0639c5a0813c050314ff0a1bc5e3a1c2553df1799002138078904bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d92e2e8fca9bd1f99e7f406762f0deda379ca11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86242ae84f35ea0dc94a1675fef1df0f654cc9c04edc7bfb741f96d6ab6a5dbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..930fe7d5dd1ab9fbe6f33bab20ad44590bfba4d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6733dbacf04a034637ab175d1d0ad89ca3cdcd0b9fdeadd6d5f22204cf34d2d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..821832e3d924eca683af6df69b06e4d641d33b1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01e785ec51176517b7a63137fd9440d221cdc61942f1d2d550dbe75f2e4750d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd1420fc1fa2aa3c2d985b9773b7b9407163e1ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c070f9952a18fb1c8dc04b0fc89c16d8a6bcdedad16ec4325cb5fdc59871681c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c0b783b53269c4abf0c212731351a1851679213 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f676602f7542835e07cd4aca87c268aead73f1c79b9bb5cba908b8b8272fef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dcd29aa9a4d1778f85c9cbe81d18812916b162d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1456479441ccd246bdf4aef5c7aefcf42ecb6f87ed5c615585daa9f00ff096 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92df69ed4063640d7a7dcbe13e6f2cfe981d5e72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08b92b471dec0e0c9326311f9bd3d87e598c6c58baf4744c8807ab4b1da736e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de149e4d927b1d7b8adc00ee7f60ac49a529878e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02099bd14cb4cd7976c88dd33f5c4a350047f70f35c3b6ec8da2615c356219ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f9d88ea725221a2430250c73fc9e1f101116fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d90696e419e37e7ceec28b6536ca92f92a4c80e0a626c5aa22871a3f446097 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5287d7cba08d4b1af7e7a726b90229a8f414ab7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316e94ab1ba4425964e6df7dedf14d056d7cb7c8a15d235f639621e5ca677e50 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6421a0e05ad41d23d4b4327696974c369418b52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b686fb00e93e77bf7ec8231e7f3394248a6b3e4130ffc50f56458e1de3fec6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f026eb64ba59cbf7394d83a8b71cd9207f97932 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4051d67b6b784de969a25cff0769c71072178adff91e12fdd5f8e5e8044b0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89a3b439c1d605d64897ea032f4a815dbd31c9f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f899ece07cea02a76e4a3bfd555749923283a34a17b8b6e3153005306e29d0dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14eb47bedff84f46cd6fed4e0ce81a6cc921daf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15645de982f52805a46e11ea5053ba4e37eb5d5e2e7daa55265b1a8b437f513 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93017031f7e3a183e196c48401cdabd32b803f45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a161d1382ffe1ed876f2989129a42efc49104c8250aceb1fd579251e70e08c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bcfbc049de79f780163e947f5214835f192099d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76a8f0be7c97f9c51682454e5e898d093b4dad7d3d246662bfb761fe74ca69ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e206cb2b7fd2935aef116f78a153d16d8f06bcd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e714094dbec95fbbc93364a178bc13bd14f229ec092aecfc63e9f3773ad0ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72d5f9364209a88e0485bd8c1fa88862c68309d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635b973f722b9bb87bbb813a06e0e023e74ab2af7210c06615371668d476d540 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0506ea1bdc45ad4ccd4129d66176e8726d45c49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac89b3245e33644e09fd177ec67a3abe7130d545ab4256b43ba77e290e9199c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b41fabc0b8fd7801e3a5f2d1811cddba703b44bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7536328fd8a4573cb498d5c869f129f2c8025d22a2d767e5e48e80ff1652afe0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4285d18f133e3fc7c8ae3c7c4ab67415db26dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ae70bc4f7e4be67c0fb9af5b2e9bff31b1c3186c358fdea185309943426fc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8f669ced4d90836232d57a5f422c3a67db4203 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b978718106b01a660b45896f689d2002291f7ea9ce83d374e8a2a0662a37f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a5c2d3ec6557ab149be7f274b287b697ff0e87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5bb7f69e9b31959e9adc23db6142ee0f5cb616cef40c847007339f6aa3db2a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a71eec3dbde4488a188ceb758467a2e2bd501e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533928dadab6171e6ddca2c615728e7fcab4c1484005adf3f63caa64f0266776 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c8918b603dcf4d539f8c3e484bc7cf86db2d02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39ac4c017c3d702488e81aafb65f7478099cda692a9786440db337db2cd964f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc17a1a35887bd387d7d8e8b9284442398ae886 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5785508667a0217b4eba543cad140c158f57a168d00f7e2f5eb9a0c189ced944 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b6ae2cfaeffefda77eb74a36fe32870524df6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5d3e0c967f92d09b42d567d0f4f7455accecda92ff0c3212c99730bc89db22 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d60811228ae0fa80180773ff7bad9fac32ba2da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad79fa623848867a41903e52d427fc0e5d304bbe80f17bd71c7e1ed9d4ead15e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7fb8d461431daaaa6da98b84849178264f28a14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd0b3ef14d0142a22401eb7c696708f71906162ed331e4a41bc5ae305e1c7ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c25116398d7455236aa841d9ff7ab966f3ad2c8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f543e24cdfc87e3de3fbb46f9386f8e6795899339930d88be00e1fd1c4589054 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40dcf5d93e34eb5830ea14655725132c952fc5e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d632a7cfa1ba74c4aebfb7edccd02fd1442a30fe44d9e229003baeb95f2553 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38dc65a410671246a3b77c166466cbe4a7cfd686 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b132694e36fad3950ab47800f3db1d871f24c7eec6e0081ac343d71fc5280455 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ffa94da06d48777526d0f0b611c5498592985d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895f04f2d809784de0b4f851777d87aaa60bc63cecf277eea14a3aea4f301732 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70600475bae36d0d2df823677e751a3508282039 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16712a5fb561cc741ac9c414f5e56af43da15f22c83bd8e074984481095f6cb2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88096e629784f401617acf714c0c30e92bf32889 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1336934f0a57d24e73a0a024db13cfaa4d03818b26567db5cc6ea80f82be4df1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..342019e95090c790a54dcee32a41f94681fb74f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78069189462d6a8f695f2fc8b7b0328e50d14a47f066d1fb41da8fc8b772a1bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2ded84ebfaa96d737b5e52ccbbb5d1c164bccf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89fcaa70d26a804c907f86f027cd60b7cdff33f353a90db501469e909674b35b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6025a0caf8dcad2c67f1a9aefb2b44421e9233e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194d936478e77f24d1c54f93d7bffe89eadc10a1efa137eae295617d69d74f4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1109622011a44952c0f2b61b039772261f713d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8910d4b1d6a0f892b24e77c668785cda55343b00b075b1cd4abc87b25e8854 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b21585eb104d55cf357a0b9828cec9b63d7d3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfc50284c87acc232754b08b6740d38b4a09edcd90460a78b36174a2a9473617 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b49a529d73966915e34b88f31a82977d0d60a377 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b0c112d2cab4302442a085a2df52561b97fe1d6fb79ffa25b6d4e2cae2f29e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e09a0750e5b391e0c406fcde94522c00a7729a5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebe083e39a8b382b4269e8d4d86d1aa44e3dc73f00b30fe50d49549dcf1a00e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cabfe44cd4dfe2807f8090dc9b799410ec8adab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5bbe94af3cb96bb9633796f55e6906777868d7a510caeaa562d88e678887bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..577216d5180815391e11fa5e2e62c7b752166da8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baed94309ed239c8e4907eee7164c90f73c52781bebb1e754124c64620cea4f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0b1a724177063ee8f025a468ba38b0ebd6c4fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b5b30a1a47eb72e2ba3fcc9c80d2195a5932f9f1cc9f725b3d25fb9779eabc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a5ecf3ed1cb7a12883822154b5b780652d34c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5d3d8903d186bc892268044999a38117b43e7b363cf41af9b91aa1d526030b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96fb62d76ae059aec0f3262ca946482e9690e009 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435e43614a6254151c99b8e6575ead805c248c7c895aa2cf07e9e626ddb5e760 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ca1a6a00ff70450748bb73bb93aa13decaa12d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81cfd34d6fff5b581fb977cc41a8f23277d06a76d9341a4fc8360658d96711b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb36a6806c005f23f9df8b25c1280a4e4fb7fc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7489e0fe962c4150c76d0cfa0059d9f8632b9c733838ec71d2d7fd8b90161d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1daa0b5d836271f6767db94c949549db3dfbf5d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e5631f1bfc8f6391cd389f9c584aa9ef95760613177da93ebf4bca3ee37e90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a7e8568289a053a717a7f1b57fc12e7720d991 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70fd4af46a64aa137c2a33e4fd575e74abbc9e38ea77fb86567888b5d0241a2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53764993c9cc5394178c99a529fc1517cdc15cc1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c287c5e7c393a863cfaff7a54d5a86fcddb53c1bf368cb8d3b51ec1b9c58e9a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8038011b5de49c07f685b3e32df3e80f2f3bac60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ffe2d64d54f5878e513698b26dfc228a68a9bbdc315b28010aea38ec75379b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fbc07d76461c8f5aaadf2cef70bdc375f77ff1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3c847ec476ea90e8250a32b3cac16222412576215272d885f1ae07cfa3fa37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa82479b09550453a08562ac7319829d4b52cf8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebae1d753b2f16041eedabea94fde93d28d70ed968fc61aeb349651e7ae9e8df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b5011c380683e4d0359383c51b24fbdc660121a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a33861f5f34e7bca7c40f558e48ea063212d2948d8573234a63a3b79c536fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d68e5d6073b07b71a9e55654ee44a05645a3012 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee59e0e574892c88dba69af85d9815372ee41d39805acca7b150c6ab6d3f2f68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7085decb5d9298f2f830fcc7b6e721bc5e7e6db5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0214e83282e39724e6c77716e85940de9b2080c2ca750e44d46e0094c2fde6d1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ce2cc76bd960e5d48b75d42552f91a6c133121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7462c72ac544fe025a8bd429798b5e1ac563e46dbea8ead44b73dd8e47146cf2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de2db0e46a751ad30c530af06e87eaaa0e276fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28d9d13eec02d4cdc2daf2313ec8ea9151a690ce4d7e492aca6c5f46e592323 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c23bb68b9722c23212e8d4982fd475f9313a83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c741019a79da818b93cc66c9c1ec43987df5d9c6f938daf2d2e9a33dc042ad71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f6c51491ba700dd7ca43d2199951a4ca8460bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd99c81c75a759c5390748ff8127aadfcf7141da45a6877a144b07fae0461e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0e3ca2462885736d47247d32ad74b71917bb30 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79d4643ea8f27cd86a56075bab3856e7850815b57ec37daa87e8f4a8e0cc0cf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5afb53fba195572b09fcb70ef1b9de26f11174 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6f0ac151914adddfcb32059e23c29cad53be4a2425bcd909956f7f08f0ee38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85c4d3cd179cd4c06ab027208f227fab57456f40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3b923a1583560cc523e796aed9852a71c4a732b4bde5d600b6f55cd5d15059 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a1ca8fb449c45c1e15c447a783c7d3521a94aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ced47ee5c52e068ea6b5100cba0969682abfb597076e4aa994da5f5f7b885e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd5237106492ed58483600f2e5ede273e5aa8a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7225c66ae2f90d3136a0cfe4cde8cbc6d27f8a622ce90615d706c2720a08e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4858bf48140f6a3b557a352666ad83bd095536b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc73e8a2e60ec508555cb398719a57d3b100c33a8b461bea1c603920e68b1c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..237c749f7eea3c446f2d72fb0945d3de32498ee0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90c7293f0779fa2aea5c1809f071670eeafbe65b83ebcda42d08a267cd67880 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08691aaa1d7b5cf34bc4a47aa07ec7f0a2a6afe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24860b8ef551bbfe36860919a553c0f6ff12128ac8cf6ea72514915264e23d12 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c84860d4b28905e086799f40368c96065e44e7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d76cd865ccdf8dda1d283579643b5f9479be6bf13e1225968cbf1dee50b93094 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16abefd770d240b0ce1361c3fd3157df1dd9a72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e4f7bf17abebae3e5cf2d03e41bb34c84d331066540a96d43afd444ddb6385 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..871e770e1ec2ba7b4997c0c188cb38c3897e5f78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6003dc30c07164549571494eb7896db6dcd6f3f1fda0111a1023a20379c1dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e50a235cd1e98c0df8b773c942c87fd8d3a8822a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02beceaab8966adfb3450d721904f726eeb74c425543715397c489f8c87c8a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fbf0dcc8e86abd4dcd0d69dd1d788adde580321 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f870978f136f05d1a6216dcffda5aec746a3a55f24a4e86385d37734f07b595 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56398eed16a129d9957582945763758e27b04026 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ab11ec4c3e562ceac2f1c23548b97c4b9d3d29a7c488c2988dd45bacf23798 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ec2462d5938caa6775087fe81d938f53411a91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536b7484ef4466d4f5819d49749eab9729234bd3e52e69cbd7e87ccc1dced4af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eddb748525b25d43675bb5994da0f9e478c84e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abf39e94432d729e188edd6b69bb777063731eba7624f6c846885375fc6cf1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..701481709cf3ffe533e853c55ffa284c2ad42210 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c796b64baa12729a96af10127527cc3f36db90204132792905f1d2c2c1c60821 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0267e1f7cadd36c336a6a8656d58d2050f7f13d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402a3fa75e4514d38337364cdc3eec3005dab784418ec262f0cd091ca97ed420 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0d3413786ddf1ae383e87bc7cefe6d26137ec1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb25f9ae9ede0cbd180029c687615ee595e7b3837ab4cb678e8d4b7e45aeeda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b35c2bd4b0a7b7ad0dfcf1128c53f033414ece5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29eb8293548f82ef19387265fb7532d8004b240cd26e239cdf4733e97ebd7244 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d272db0fd1b1e9e75d300284cc18e94aea6d136 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ca89f7af5d05bf08ee0d51df02fa7b22a39544049a75c6e5c0fc9134d765e6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d9a99c3c013f3142229d4a53da0e490bec93cee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e80cb1071f05857d016504047bdb281f0cf9cf0060839f224b759d047ac0649 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d318b26b49e1493f08d85939b2d165830627a75d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc4929b36c29ff6ad051443c761c7ade78be609c68327a683bcd3bad63f5d6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3712ca015fb68c940180f8f42b58bb4d76d9d285 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5fec268eaa4165c7471024a88decc266e40ea5ce80f77b6f26a307aa36f4c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9560fcb66b5d2cb8c68ed3606d065f982b6a3d6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b275d3027afde974523c4ea67ff7dce3ea5db96ef2d01ac385a3ed4b0625e5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..797a4d063f5bd83e7e82bc8a90fa7a5d0a9c51f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d85e5e9c80c04db6f5ea1261735de7de6897bf64149821a1cd7834fff62ca5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4059cb94df450760978897f4d73ec0d9beecd18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da186aac5ef580910471d2a314020b81c78a3a275905c95fe0eb4f30b11e4e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b428d338652cc4f76f803f534b1ec52404b8f6d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9cdbd532fe06be9a4b36d1259ee06f65958423ecd301c3dcd999805790cc3a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1871b9a61d9e3d827cdd6f1e7b342a6a0bb8a3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6afc62eb18202c1023e22ec57df1dbad88e5797235f9b2cc15912cc8892d93f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48dd69154c0f23ff9c90f1cbc2c1cedf629d396b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73791a536b622b0fd4e7640140327d4902d991225498b7ca5283e3dc30b635b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..daac1701d0e6584f4b565ff08d2c4c157d50eecb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df534c3fd31b3768fd98a20295c43e2a25d61df3d815b90df8df593f36652a96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72cbad2e0dcbee95a4f3b3ca6afbc8270145793d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8e0df69e175783d3abea17428ca1113227d1c39897c77b1e196b71b63d10d9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec3fae716a5408082e47f2ddd0563ac27e0adf71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb20fd51bdd6d066c8f6c1102d55f72de147baa4331f28d7e2339c5f60f4b96e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d2fbd033b32ff2e232ebd77f8507cb0b3a4857 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d89fdaf70764babde3d288d9e3caef0acaf664ee156e7daadd9a65bf40c03e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4ae346b549e1bfb5e42ef9c55a4bf7a54dae18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d4e9cb61e6ad04a949ed2bf47578efe4652a8f36c19396d9cb4e143343df17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1499003e832b29ea69a4361eee9b35f1a3d6f203 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6503a56706d99fd99a6a96503728c86e10a51de80773faa3dd3f13c154c8734 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e841935f57180f13c697ff3f90a8e85d6c01f059 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d377b547b1baef747772889fd830b3208fa2603bf589bb74166a680f0b4c5a7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9604c9c57c040ad8be2b6f2a6af4072a43f2629b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bde674ceefc5deab586ba9743148283a6920b344d1fa27bd492f20017b72db8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf8d9c17a9633f03537cda5dee7ed32c4d0aff4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0b7a68019491e00199929deb074ac531db33c5c6a5e97e07c8fc30b2657234 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c10335cab500a17614b87dfdfd5f0a0a6191ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67103525c2c6661a74683c2c67814fca68c9d72f68d9f999571ae4e169b8522e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec891e89cfb71eff167a726ff353c71abbcf3b28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7bce83d230c97b582f43ffa7d0ac5104887a993653bdb1d674db3159d8f67d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..feeadbdfdd90385537883b2c882c97410dec85af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb9895c6211de3f1f8d3558b3d58bc45b527383413e81bd637045ed52e299db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a41460f9c55118705c7d5860fefa056d5004f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d320f152b60f7a9989f4eb5fbdeb9cd00be3b24732ca97d1d5711f92c1b6dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeb2e4e29ea252f6f43f32c6c31bbe34fcf446a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80cfd1c121123e56488ea2b580f71dc2f3d7bdcfe7a1ed361365a4db877c129f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e21b12a7fe3742a26c49f4f2290faaeb28aaa22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de6ba6220ef4602efe7844bb01a037301d8c58e29c9a6aea48839f9bf172c64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17b6f4fbfb51f21ac7324474d503d4e5b8d30666 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf955c3c99b318caf8e8501562e2d903692c38f535459c752e6353fa9401382 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7e1245c4dc0e98963ade7134def506fb8d3935 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f3c7ca5a3b1c97982688a25ebcf3b0b95fbee2c998a41ba6618e86fdfe1cf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b984bd7116405c26e0858390c9420b4a3a8f174 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1db3debbb340b0bbff5344529e711b9dc8521a1242844a0ddeea7c347a0e19a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..996efa26b708da9a794831fe44d3e8c9dc8e475e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50705de41b9444ac6b81b6d800ea2f44438e5af7012f237072074d0a1886e52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11463ab6ac393aa70907ffb419c15014c090712f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:776ed8986b2ee26d25725b558162b84ca2554a663bf264d59edaf6d850499c15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c715b7db111e6590222c0c34682e5de1d670f5d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba170c20576de417899fc929d9d04066855040a5c8d7b103ad7cecb01b6ece2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f00ea9129727641b06e225f7482db6686a27dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c32eaa2d01c9619f69b2bc89253acd084b920487bb83d8ae760b924b305f838 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e904df7d95f691071df1e72540428e7ca93a1a7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b83ce32800339344f6fd577efb423bf81621a00c4d7352cee0951a7277d1b6b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be1d00d4d0a1fd31aeb65346657bfdbeb230cc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e16753b069e87ca1b70b26d880dc8b0ac61c3d5ab9496ffd8798c6251bcc02cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b81db2431dd0956fcadcfb293bd9c4cd39414f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1b9f41c196afed21e4507458b005e3efd73f5306299e9c41385451ca126743 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16b13f8a89b8ec63917a9875bb57fcee9dafd696 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e965af4d501017c1a0a078f9736f1321ef47fd78c0ed6c3f80667c028e04f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4fe56cc681abd5a3527ebb5317c50eb248c86e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557703fd8f495b309a79f3b8bbfa7ca60954f0c022db5967780a21cc9b8b3468 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02662bde13cbe8790d30cb5c743ef8f4420f5607 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5ee536be2119057b37ed2b11544db49ddaf4949ab35071fa7427c86b2535c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..add31f9e89b25c743d1a96b0293fa4bf49cabdec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e8494d2fb78b9b76d261c74b0ccc009211b158807df5941e44590c72ff6eb7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f7be1d320acadea422b80e21b9f70cc9f7f4eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7ea17a6f248766e47fb26596682d73aa7572f172cd965a76cb6bfc75c7f677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f416aca8c958bab47232784b59f4ea7960e0bd5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91dd4b5faf1808957f6896f1149f314f52e5cbde985bf3bc2314ecfe75eeda8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e83cebcd6c734ef8289e8fad88573664a1bfd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f377d154e0c540137fea3652a379e3ff096922c3f67830035814132a2e2ca4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e4f5edf839e769c308ba5796861ba8439b534d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4303fc88d2823f020ab4bb455a779f711e8bc03ddd1550fe8abc1aba98023b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a27cc9ea71014359e744bb5353d23b77920b59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18dcba6527c44db1f1c72e698395e5506a50777c69e75e499d050f2b6a17da5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6024f29d986e21c323f903195eec2d59cfea8074 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:976f33c343e0139a1ddcddb3dd7bcc819efb1be478756aba5b5d6422f7dcc29c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aae059849caebc5fb91e5d3bef93f18144eb457 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02132fe774b946cda144115d716035384a72b7a2ede65ba6b8011b4398f00c5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4626ba7566be39419ac85381abbec8fa12390906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4cda3f268046b7ddeb5d3d88f145795a7d7b74e7737b174db0be5b1b55546f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5051b196c898057087804220c298ec660b1180b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6510a1c8a7f71255bd9dae03f28eb19139ef5e12b0bd7d615130859caa9aa8b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f8f66a02cd335cf057341c3b96fe82f865fc6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0824bda60913d810ddc89aa3de1079b28954bfc08a3238ffa490a680c022546c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe763d7cbcb09e39a0ec49d96daa91a9ea815a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bcefb13426357799e21b23fc20f506b4a55f225a523aefc6dc030724df8f8ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f8038d7580248927e524ed93c8f1a8f2777ab18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3017847773246fecc7369f0f6cbc95a2b348ee4ef9637a7d1dfb943969c8139 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e53c9eddb47ecbc3205e4209842b336dfeade4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57fdea5fc495dad107a824422261b6c2013cc944c64d7759a11085e9aba96618 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57f43ae3c23b898707c66e0cd82456b7bd7f8c6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee8f2aff2bd50527ddc2549e1e2613b970747423943de89f46fa7b089fd0d06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7097218fd4835f581bf0245f2f4db23a781e79b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a20d4203ef61213137f9ee2ec2104f7b99344cebed5372dab425c959c96281f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5d4c130d899d0af51f141be2acef5bcc291de2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d30eb65fa3dae9821d506a44b2a7dc7d81e036e4a43147fe70c1deeacbf2722 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8e774ffec72a289c9584bd201d498157d60712 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32636385b773e83c319b5edc92b42738431db656cea5463b1269177815b652d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f1fb01efbb53d46de94fb2d75bad87483adf7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b36a5964b236f750103a955f40430da798b2e967dbc3e40c44eb6350ce7f929 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5842ea3483918ed46425548854c45dc4af898c42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255abb33573a1ed66afbe3fcb63710a395fdcd32bffa4293065ea4c083d90ac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb34b3670aeff5928d5e6fe8cff5f13c5b8c802 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f087225abf9046f276d87b7271935a46bf56a24f6a1d9df566c187a8bcf285 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1caa8299fe40eb37556060989666eb59901332d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa6336149a8fe2a06f27994343fd8feaeeea53dd4cf1cd30f190d91460a1b9f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca09ef545c024a829100e0cc9d6ef5f43a2f2c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df782d6d73001a84f7367f7eacd8b54494ddd3b7742200f060151a99bf707fe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5f1b767e32ccd436c5580ecc0ecceb605b11f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697163d4bf5de73789640d0b7efbfd01e63c8efad4000e59d29a8be6a9fd1075 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..127c83bcb109227a99228d0f3cb0403c5a8c3069 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d8fbe13dac4acb6f3d85ca710fd61f0545513424a3093a7db65c81a75315bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b56e2cd7b7e3bb5f16a2909b474ab3303b8ddd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e5e23388d052a10e11879bab4d06a6ecf8905fd10bea602ef9616c7a47d93ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28c0f3a94335e49a808ac3f0b967032c89b6b0a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c137e781c7049f6f075317716dfeaea1409c321d390581abb91ae76f83375a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6746a69cb866589cd0d565fc0f344e619408f3a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f760cb357ca4bba8c92bc1b3965fc968676a9b10f6dbbbbe5b77ee64378b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ff601f51aabec07b115ea026b8e107862f1f2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97aef98b848f17010f2a2ae5b3e9e0812d29e757ef64ca1a5ac85be1b4681694 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0245996553f64df5938a8bcb04abd85ba9b82f42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b914108ac81b02cad2512d880bc9e68d823c735bf6a1d769a32d72070a4b378a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a1ce081e6c0129f5a5cbf78d2bc1f7c8c304f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf508f7e1bcf6e6b926375740e0b1d62429dbd483435978bdb8fdbe93c9f79e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45a19b3dfd77e10611fbc14bfe04c6d32910bb52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887b1a53c6a47f23abdd7e572113d5a72347e6fcbc41a74862c15dd05799bd89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..034adb8159b1e3b29531e31bcfda88f34a05bbe0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4c2746e035a875f809521cc152752bcf2d879d8551b7836421a96bf92383a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d1d3a8adcd5f570d6da38a708f897ed728d708 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2274913e9ebc6d7348ec1bbb9674f9c14b7112f88bccd400a144b9892ccdf010 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77803b78e82721e7b40ea170a7103c8ca9c1f4f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e059ce5ea658f80ac812a0c9e330395f60476ec99a5a6faea38d074a6106359f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b549c9c7058e61b67b60d485efcac02f044835 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7b4803a890eb5581483f91f3b7e12e608078146ed8c0887dcad1b9b5fc4e88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5147a376d03ff12b6c9a20265283f46afa6fcdd3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61e364c88a5fe537a834f6285ffa0207ad6b76fe1ac1b589cd7d7f8da5f3427 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e900bedaf7f0bc4e6653b9137643e5a833f4659 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124472b6e678c2be56714ae0f69e2a9a3c8938b0f9797c06b86aa7d7117b36d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13db740b7749514ecdbc7bca0559fc45c1303897 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac850ce4cad673ba1ce62a21a27d6e21317c10cb56be099c0aa08d03447f14ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4533e1ac551f2ad8bf12c27e5e9f162f813a7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b79b6c65cce87f89c495ac46e26cbdf56b005c1127def50ea887bd39cf1f7cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8bc037228ec42df4503712bc632fae87cff88f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1488b1491b75e13f362b3abe198ca3affd9305a4eddf554bdaa03cb50647f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf3a13b8fb866e6c62a55076c9715f217ec4a74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0fbc7a8eb5f2c82d44711b0b2e8ebfbeb90ece95ebce287d3015e8015b2689 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fdaf49f3788d7b0da70add1e055a18e67a239c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3446a4e086a4aae58732796a04589c3a6a3c7a582488e16eeafec76e52f302 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab18057a21f14b3d7bed11abf12e7e9840fdb7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b3f5b90f745dd10ec840346640090ba6705ff3a20a0382c014053e28e1ef50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8578fbb3f84e56e88671f982bdff1c314e98afe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90cfcb4989f93f89a47e2e4f55942f605267dce9fcbac57a41d9846e84f0005 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb75d89124badc2089891ab7a34a23672a3ad0a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141d5031e41b66454096a2ce3cc40c8f7e49a67c422ccda18ab120599b11588f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc83574aa1945f5ee6782d6643b1870daa48ada --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f3ae08e86e899eb22f0e5f96da6e1d9f51366fa7ffc71e2484b66ff26177e3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..896c74497134dc4c6cce0bb296d09fc971ee2ec6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48596e0df9e517707da86edcec7d7b7cf23ada07d81fbeca2bde5b313f51761a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8578f867250820d5ea950cc526e9f927a82b742 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02a62747ad7566ecf864d488867767c239e51f6dd9e73fc37ab2eeb1b9c63ab4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae9ff5ad725105d8f17767c68f2aeff2f4eaf846 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6982ca69c22bdc81227dbd2d62f9f3e298c1aff5c9b750c7d5558bc837960fbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99fed3c2b5cf873cd7e711fb44ef3556f8240239 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef48366482413bbef273e65162556026a1261cf999ef424f43a8e6411b393ee1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0f1085cdc97a55f411426a04614c8282eec8d44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421720f46fef13cc5731d2883809eb795845e3156b64d7e4e31131188774538d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e180832b33659b398e33df61ab8fb8c107a38b1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e21da651ecd2c1650498dfb0d6895b6e108a29df02d7cdea10c202cc83f4df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e1f440d56e4e0f2f59e33ae365e69487651d8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2798ff73cf33b278f0f9791b6ef6be12fd30a062b821e7e33aa9e269ee31d17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a16dbd33682a1b249d075d4f1a41358ccd9a867 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac0c59d7d32e5fa95da852b3667f81de00516f77a50239593d73c98638af5c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c56605d743d1bd521adcd9c9225a0a9d72903e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42580cf77929fc2a9db600cc42404ca6df74299be9385c44129ba9a4afe377ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc07d51eaa8040c374447db8ec5352e807bedb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88fc9cc2fdb5b8bc835605bed2f30e188182744473e833b5c023ba84db65701f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5179f00d1689274e61a6ef59d9c361fef68a6b21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d111557929f783128809174220252e8b8fa04c44a436e2e6d2884c7314316e62 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bce076537a22f52099fc1daed5f2a7c4b4b76ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a723673d123816f385c6a75323e8a9c999a7ac535c9abd48fedf33c5a2590821 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4216dbbd3d551be97aac5921355e7991c48a7694 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70655e1fcd978d281a483327f605315725b54e282c974c50c144595fbb695dbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d0869f774fcfa3c20276d4951af87d89a7fdba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c821ba7b945d07c4c92622afaebf8548932662fe769fac3bc008b0566804cfc3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aace41641683ad3076e348f7b770936713f0dea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6d2e3c49c154fa1e5ecda7cbbebb1ce03046dd93e5b9abd733b93b3c05dbff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1fd9f4c0daa5ec00726bc04cc60bee39dba15a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e06cc6fd77431cda831d3e1110619b9a8ae6e0f92ff3dd5f875135027f4875 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78f029bfeb814a3c386a35e3f4b6886113a1a35c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc66794613d0755f863ca0f871d0ff957b4257933abcf1c214e5b158cfd595d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8985e0b5a2e2fd57fe412b16199a5199a794fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b24ce9f6b40bc8bd9221705792fb6fd92af9e625080012c1bf3a3e6c5822ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47780086213fa156388922f6689f38a7ba9586f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7814fa584313c9689aae254f2b9dc102cb88c6726d65fd628af2e716785180b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f430f6ecfd358d6a072cec154273fafc84700214 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26dbb034802c3f191646864c9bc3a178be9c9ef445f007294d377476b0f83a99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07793c0d2b68c8dd8c7319181fb2436501d47cfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c0c0571dc0c49b587d8fb5f8b951ab54522590302e9b6899da2d48469b7c12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6c412fdaf824bb28a5fc3c8768c49e0ec664e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1296fda13ec707fd8321a14bf20d1a9246107183913b3ba7b2ebabdad30cc025 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd75cb3c2673d2bec3c6c6210aac85ae3a205d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c494b70bfe957d08167b292028bcebac1c1aa24738f99d3f631146249576d5e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fc81b734eec5b7d2051cba6bbf5997ffc2f459 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3470b9e6debc3a5f560f41c66d10cdb861ab40e1a8de0fb55f408f26da9bbac5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1862b9924bb04a05abc03bc2a05b0053d76d856b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3eeeacf9e0dc4ab0c25625d1d2a9390fd5375bd77b8ed22eeff19bfdc66aa00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00323e4f3dcc0f8868ff80f7e8f6caebe5b9e240 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:880735de278126981eeb064d50ba2817c16e8194349300474052fd9b688de83e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7254d5f572fbc5e0a58b3760f08886f4ce72adf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d739f79ef1509960a87b8078d955dfd2b751d624bb3058de6814c817298c30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..819a95aa19bf97c3b6cade5b7a50bb52fcdcd10f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9220a8e3142933a1bf13f25ccff5fe98dafec6664e477090c61e5b6c6d0495f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8525616a23870f9da65d59e20b4b8c5dedd28218 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513584ae6306bba4ff7502b6df5dbdb0ae4635a51aba35474b8032a36799101e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c14758e00e34e3cfbea5b23c5f7884835030735b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164f93f5919ffbf9c89f30fc000748debc0cc6588da11574f218959ef39ca8f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1913c07feeb214112f176634a54466d6f2194088 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dd623c7319789bb7d8cd8e8ed4e98bd93e07ef8085f33c3bb59487f64b3fd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3a86b895f2f5aa983edbf7fb0fb5bec902bbd84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38f5f3cd3b6775d801fffb8a88df94d7151132dc72503f5761af63bade634f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19685980332311ac9296cdae338ced001ed11132 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee583f886059e50ed3881959709553693ad7e236f14bc83bdbb2e77f12fbed4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3367ad6b3e026ef446416b66234fcb1a3d8a50a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b138afaf27d018a5251e24b87cff1f9b3fdc5d2522572c792e5914bd20f843b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd3e53e9d2c69871ea5fa539eac71d6b533c7fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98a00e9c661595143f8abd6412a4c204301b3519ecf5e3e46a8eda51e5357912 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8f0c7e6aab0c619562286c986604c5d16c2334d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f4a611353df4dfef54b028bc28eb6b767345d3ac2ab9adadb65cf7a78ab4ea +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4774077cfbe8b25b9a8c046fe786cdd641fca42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27dac2e386db12d2dc273ce368e46138a2c86581391673b6aa549f8f68d3b491 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b8e7f2a7cd87511785efa563227cb021f6e724 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c476d961c2be552d204cd4f98741c17c6edb87c2058d9fb08cc2ae504736cb34 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..696f86c72d6171f04bd5b4a9bbd923ca85898a60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0cfe731bc339d970d324fc1017a67e8dec2f857fe18ab54982a3ec57b277682 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccd96f0078e697e98dc40ed04730e89eb5e51873 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad161ac549e986b462b735a3db9fcc03ff83fb65c9d3ced2e42e8b402b49cdc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c43a2521d92d37cc11d3bc6cdca86bcc76db774 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c80333e81f5b0518fa2a86e68f8cb6241263efab79ea442de44272d2a28e13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc8ba48c02fc1cc5c51909a9b1e8099b9a83afa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3950ed097ddaad9a1de8fd0894b19ae50a3f8b158b978982b82ad39ba1b037a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c99f2a1e3e1b9be0167c0252aa4dee6e2f4b805 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd66062c992ba83dbcdddcde696f31d888401645cc900a9785cc40f18665a18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9db5b7b4dbe9dcdec215ceb416fe927b9e7bbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e901b6aae56be77442a0a3286509d9dbde57abd7de40f4f8209ddbf101e2647f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23b237d2ae6340de9d94110e4723f0703e846d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6b77d2e479209921861017ed3e6a1fbfef4e8b396778fb582587ce8e1389b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fad15b702a98b994500c518ca102418b46eff62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b19aea7fe82e2410aae20a5c9ffc7b85ecee0c0926d6828389a188d7c24f89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aca5040c76527d5fd054b293df6cc68cfc33069 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99e15a76ca190ba184cd41b389b381941155832755699e97abed7c8dd1b5cd1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d0f935da08dec266b15085f9a42e3dc4fde55e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d8d29f56dceb7ec2ad0aa0853a6546b998db5e6ee07a2f82890c5de1cff31a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc50d9bb7eb5840670e2603c213d840bef47c484 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7967626d9bd848cca1aae1cc651eaa5116674f05296d3e10cb43551563aa9a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab73ca5bc006976b4acc848404cb941b6f35ce76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3348397190d46e385e7a254e0e169b8f97d4008cefa9a0d520761298c0bf86a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68aaeec0f20f9d39567bc367364f9fb33008ad20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fb174dbfbea626eca15056aed09787f58f4057ce6435001a10e4062fe96d0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefb84ad439d222744f2ac835fadfa4b12ca1ca2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82a09ecaac2946b356fceec4057a8ac558cfdd5638c5b6bb936f64d11cf1f43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab00cae9bcbffa16d07852a799d6fa7dc2fed2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e671ec11cd6d6cafc6a404edaa490a0d7cc6601c4e780ee1e7488fedf471cc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a40ba9d20fcb6d81a4fd5f957c4a749f81b634d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae6c661ed7fd57eb627af619d2d86b15599c0bd0df8a28cbcc5b16704939809 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e94da46bd14a4aa26c3c946b0ab10e551ebb95ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397f059798606a0ef672e86975f26a81ae07834c6c20dc9c77947793b5beb949 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04690c0ebb439c16e334b1da4edba7e7b79315a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61f330783b2c857f966392c4a6c41410e2ec82fd652cf00f0f1ba38a9887085e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92f31f9dc6f2646067c62188ed99b1e02e38a83a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56c4cc61ee5a56b63dd5f8d7cba3ac8e6103bee6c184ed7734ff6084ee738ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0b0724b4df5ca3ce9233132c3defb12a30d0aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e860ab623208e272624721dc8047d57b7915479a2b2f9bda2d3d09df73045196 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92692fe2cc1c705471ef9d48206f20003b662472 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c2864046f0dabe7c4294618c178c0eb3bb4cfc0d0f5dd8652206ec5d3e4781 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c0aa10c5e671f9f3464f39236fad4ffb461a1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f7774c2c77cbc28bab59222b64750cfb56716cf4b392af2e34cb4d067fb6f2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d78a1215d8f3c94ba87c7b9a2905164071464a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416e6c7f5ab5ce04d796196aede6884db36ac42c283d4130cd85298f47df68a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8a24817173dfa4fd450e82a9fd0aab4171d11d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c361edb0cc39177ed31fad38ab2eb661c7c0651f3a8d691cdd98c0d663d141d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7957fb31c9b844718db068d1046bfefa424f8dd0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ace1975e05ca33cb8cfefa60c7847882fd55bafb272e7c6f94cbee2ff4b7e87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abcc07f2356151166021a33bfd3e897b8c5edde1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323f48eeef67a7a1d91bdf76cdce0a02ce61f455ae09d90fae3ff41aee11ab3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..797806b59dc0e15e5fc0bd6149c829b23cce8607 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c39059294079dc3ecce456625b2923cb49c16c594c702968310523c73cbadb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e799afe2054f1f4052bab95210d706344c36ed77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7632b6b18fa58c0e03d3540e142b05d228be515b991bfa16db24ab659b56eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6745f77438d81c16cfde29e5ce9dad9e7624df53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2232bbb7bb2cfefecd95d77ce61c130b1bf9b6905fb0bd6191f331832698ea3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab9df276caeed98a7608a8f8595f511fd938e1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40482b4c305c3f703e94e64e351fd05aa89b958c245308718c661be7a78b5ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8a2e4c0ea163c0c6ad94616a5438c18b2268ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd87292f5672685b8ad3e4ecdd23614424d6f5813cf5d61bc3dca087bda0347 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f354e90f65ed4cb57a635fb2f0e7efd1525f75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4613d1e421acbd9e8edd5e99004a51d4dfbb6108e78fb0b6a74d96f445e749cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80ed32478eaee66a32671d8c62d91385fb76dabf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bb45d3ad6ec1a3aa5796f350ef1dada9ba9a2ff7e2945045809e27f8a3fe7f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2800bf16792ad6886a677c8c135d6f61d05ab74e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccd42d8fc41effb807ddf8758d2e613f13094fb64b3786dbacb7a09bdb4d932 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..032d09441bf90aaf782704f8f71f7da2ea97fe06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0a6ecfec44100907f761babd80674a43047098eec65aff7cd962eca04b977d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6bb69ff41585ae419001d2690873b34bafc542f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b73750f0e39e50d9bc64ea325b3790b2eb352d00b2199f49b02517a912369d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05777288df8afddb154bcfe63d2c0798feb3dd84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7121c7c8ce1291eabdd109b3cde1f3f4a3be950834c39553617dbb3b90f30242 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8280c180b8d7fa2e9c6799b2c893642eb612f591 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1528ddd83f9689237b7d5461ee61f5d5b10eafca10cc8ef4396df19bb51a59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efc166b82831bb7875c954453c62abd605017e78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582f936e7e06d3161b4ddb9d030d20258d32a08f24e067f0c41f8ebfd6bc8a4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8205993a5e4e96eb3fdff8bca301077d4ba9bf0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7390a866e45e0c7f7b3c16fd424e18d6b99e2fe9c4c5e2fe4f19e898e5777e31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b7bc965ddf91630bb6e65e855fa8af8137d6b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4780575526cbdadee8c039a6dad8a7850153e4242851eb717540b9d63631ae8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8653b7d81a79c7444d8a23769403305550b73569 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52d825cec66e9c96dd77a20f67f16afd5a51ac075d8b86c4a1806c8b49133ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..510d0bf8b58ebdbd242d5b6b052d5812c1c2959a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117bc54aa291847a0e3e8b8aa042738bd3ae21bfd52a7cb7d7c9f3f0b2d526d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bebc81489a3f600019436799705aeac8900a6e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0a1aa5e9efa71123168c9a1f5545942664bd5b8a97a3a3b33a827a80a3ab89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cca97a8588b543922e158fe0f5408b783831040 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2d73fde87d6fc32b042175f8972c6f5810c1864b75876c92aa3d23696d2d35 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd6bbe4e5531f81874c0d9dd43718fcb7bd25506 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1989733fe3a200f40348fc7d6bc9ade737c714d4a30ab1269b96374979ee1ed6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30334c0c03d612af15de763f7d1f17b2b052cb6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4bb5752d5dd9b33232546ba7839cee5e7eb6767e87cde167a10de6c08ec050b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a5f7134ba6bf40c3e2a68aa9a261b39f116a55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb849ad50c984933dcea5637697f95bcedf1cb603f3113a8c98eb35328c34f07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d16f19f9600f4d81015209928fb02c48c220d87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cebcb16c194dd0a6ce318c75eb5dd9b132ef2c771316a61740a7e85d1d9dbb31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b03683f8047393631e0ca149e41e7d210177020a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464a5a588c67c349087a80559483165818161f1d9474c98b1b016a132480a761 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ee6f64cad896ebe3223ce35c7f0bb0c3a58bc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a988334f8fc478b25a3d0f18232a348558b3015790f571494903b7fbab9f4fbb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b04babea1d735d50743959e9e7b6f640ce33cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466d4feff2bf2cbbfd1fbfac10a569e5aec2d56734b83e944fad14dfeb000056 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f5877e6eead0f4538782a694cb743f54d3329d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5c1774469fd7ea659db9015b21794f8cbbcb5b33b7d33a111eea9bec431b6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1907c9d94441573b0c917dce6a408c6ab613a6c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1440f94e889004ecdbc97c691bab5e34d242ab11505b02c8bbbfed3dc17d43cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4025175f9209fdb8f9444289b53b712df775a5a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32363de39e3b463f1f886217cf54de6937b93222895f50f9ae20149ed6200223 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa00bac895fd2e3863da755299e54af4b87b6750 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff3654d3cd36b4b0db721229a7d7375c117c1e9b7d2e6caf649acba10742674 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7479c3c32e15731157c4093d6cffdf035d507936 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd342f53e1c4962cc8437e7f448bd2135c197f7433631bc2e9057c10d196a03 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54dee3c11f470e73f5068f5543e54e4eae504586 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfc427524b0b250655ed5f12ee4cc90f8ba57d1d47e0910f7fd18328f51c334 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..450820c06a3301bafe4d15d3b00e0feea048e629 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af29a25fa12a70719a8b4d45319da8a2a3fbf57bbd5ffc01c20f7a1a3fae10d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f41a20c68cc1b439051810b360c14414d6707a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6509bd30ad02c1ce5a1c3b860c93cd1fb65b6cfb201eaee7ccc537f230efbda4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6f28275edc97627bc33d5ec8c81a55417d9988 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde192c47f169d41bddc7e8e14dc66b3e5841ceceb3f45e828876394676b0aa0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53073a3fe6248662682d4c1444755d4bde0de8c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b355af01d678414854a1a4e6d99edf455ccc5d474c463511b0b95289aa4fee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40d7af1b7e464d4d206a315188ac4d6e8bd75260 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7524d1730a0b0dc1b4dfe00639407d922b94ba367c2f72fc19260f75ee80bba6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1098dc0fe694b389e3b2a2255b2353a6503c2d97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e811bbe181ade7c62617ada4aa8742d319221816fbc2f2e5cfcb0c1bbd2b6dc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a30db61ce2b022cf8d820362d18262d8c294f077 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a4877e18fcfa90facb4222101118ccc2627874a59e4222b9b97e9b351a2040 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c29c243e269156e746cbbb8966f436c63d86bca7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd43620c0eaf0d9d9d74bff4732a400e8e3137eb74c845a40f0d97319c2e81b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3c2c316f35b210a8a8a6d05141b02e3571ee31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8a940461f4bbed02d8ec293fb730c314985ed20c0ac4c541f6ce47d89a876f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18d1f4c17e5dcea09d3af4e3d09b11689975abd3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b034444e486efff886514f8f827754659aea9b4a6d912fe38ae0815b751a6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d305012ddfca6d1c68dc3fecc7286dcc42ed41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d033e90c08fe4c6c28ab060050bb048d1c0d5ba78e80807a53dfd72e2a03bd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e640995ed25988282caefb109d59a161ec5b8344 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d13f9a2ce12e0cc514f498bef3e2a27488102db68085191b0af095e0297eb04 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa4febf3b35d4f788fb87a4ef183fe91cedd4f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca664a31488652d4a30a9532376c5a5e93077a39d316b1c1153dc98bb636ecf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cebd00cdaceb5699d934a20d1fff84499435171 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:642da9b13b246db25c3906f06868f5dd28c681571ad8def1ae60466d1605a62a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc036f7ef2e98763605ae886d6256e1167292e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77cbe903941bed4e8ba86e43e5ea5eac83628ec8cd9216619bed3c3eb54fa9f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7054a883ab9250c64ec5c233d71883aa7bf47d9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28999c4a4ffb9109aaaf8d91d1ab770462106b9c25c858310c5a66762c4629f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..722cb4165e59f554a0c65e132a903977d821ec73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2008e25540a2c9e8593a5763d56b5b1be2b763d2162bd5baaef81b825a609a84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b582b082bc57ebab42e435366be202ff9499e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97799055de40a0464cab6b7ed63f820692ad923e9ebb1985c3e2093b40abf21b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d1c564fcdebe165846ea48f393c86a3f481c20d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0720271fdda1b2fa7c7f39047945e46e9345631d549e29d4e8ba2518a75ae7e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c3cd921a2aa2e21744dc8dc95c968bee9acb704 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c795fc74ca3012e926489b5c462af28c0e549c9a441bcc2eb785184858b0165 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b1f482cbe258897464380f00429bddfe801c828 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1c7c7dafbc7a2d9b7c8108fb144f533fbf2ee3889edd0815f2cbb5227ecf76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afffb9568ed0bf879f2ece13be415d800f870479 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2686e98649195a304a56f9c1f2fa2a89373eb8c92566eb2baab77fd4343e464 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd922581f92b64a7aa91925681f32173fc48a06f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8ee0ed76dcacef00c7903b86c9686f47ac9954f2c4ab02086fefbdafd65527 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2567edf062621a0aabe9cde3dc5c9b8f55d2e34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c5795ae41ef601772e3ece16f679928ca51aae4adf273a8d51cc3da654faa9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a35f5371bd7b3895596a39e886036eba1c8c651 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1d2ec09eecfac88e280e69fe85300ccb71a13ef63535583ee7231d7fd83cf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b63a2ae4b83de82556794579d20229bfb57f03db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85a550531dfadb274f1bdcb2c8f03715367742826752a8d8e3fa44144126758 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc0794206b003003d9a027790aaac1c567d8300 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0244c798ad453b36a84e07b9acada0f3752840646d4fcb1eaf73e6ce656ef19b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c158c7e797af2c02ac88bf349d09064921c3dec8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0acef08e1f2fd69c399d2595b9e8085bdf2c3aec9965b0089299fb772db9472 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5ea029a534a4addba250d1246596017eb302b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c6575246d7ed0d61a62661eba18efa6b289585a6eda0acfc76bb3df1e752e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1feb0b8627b6900e03104fdc116cadf78d4058c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:260dcff4f9af2fb1d804fbdd20e4855de4577f145324c267e07ae93af3256d32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26ff3b6f06bd31b8b51f64eeaae3d762d30d5e07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4487ff09f69c1b4eba87e88142bfaa674c41eea9f44c2be5dc7d6ac30663c985 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c753cbb8ec5a656794c81cdef7763d9e91edab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9bd250bfe10c99ec5a7c7b113ce2173a8f03bf54259503022512728a41fa7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10cb2764d84b1e48b02b672f87dd1530d7989dcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034a1c4ca92c4904695cf7925663bac3c277f4fc26cab3686c34e918f1ed467b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5afca108a992fc4c5fc2de987d84fbe53cf09fcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c80d1de6698a73645ac0c1607e0eaea974c75d129b7440b666d2c1f86c8c3605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a95cc6f3c3e38e34e16b3d50d7528155ef92fbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d91eaac57710c454dc5dc5e3c6651852a16acd952f4aa4b984c55e66ef83ac1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4eeb2e5090239a45be08c87fabe3a6df3069a1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11bb23e8245d23c01a7d750257712fd737b28405f84001f8a8281a22b99b39b6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3f4fa58494f81c98d514ce75f6c03e4d977139 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a3e6c1293d939c0b6d9632db4d5d18a9cf5c544fa51e7b332d9c5496216ff5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af8b723ed2efffcd55290c49069a00c4fcb10ebe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa45ec287963ef413712df7dbe5af05e3b9ce3004670cc543cc052b102649e04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55f2be7a2a7e53f44d81c1143179c985b5f7bd52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a273b608e380523a94c8be954b82822c5b8619193a4b91b839fa50b948b6989 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b5559369bd722cecc606e88ef8465275d115e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b74f7ad794ccc0866542d326bca2ae721e531a69f046e1ee4ec91f49e62e4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3074df8d44ccb53aac9b6ca2733259da8c95df6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4cb7da3ef930ca991b13e9bfae77a0cb02cc8bb3c735ce96e04a373688db36c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1694f75679fa5e01c62d377fb1bb080d0e354d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de1cda701fa6b6e99794796f14b27a77d36ea54b29a9ebae7e8d73e93bde362 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a047e57ca64d156b0f4e1e11a1135a9b41c107 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b858724504338f24839d1867fb96e179576e8e6b86d814d2eac22bf58e0a00d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eae5563bc10a83d83a16a69ad19de5155b531e12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ff7f272ee6f35b1ab55f6abf15302d741ad44d6ae48cb768bde1d0ab83f449 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c425e5e5d96088e04b89e5dd62b0e45c566edeb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b33e88c9f5c79fe49dd5a7aa9cccf0a2c2574391b3c1be354cf3a3c57cfed6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae3c17df42afaa1d2ba3fb26e3d30114140462c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bca8b2799a81a180785f7ee25d5d5825461ed5cde6ff75b3d02db3cce6bd09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef77b00585db40753d41d074d70c342bff80c9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779296f0c2e8a9d0af87e73acc33b24ab9a0dac87ff592adf68668ba1ca7a49e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..457dffc3fcecd37a0f5d74c1db518eca20e5e821 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56475e8da9cfa7cb9ece3f2721feb8e6993ea8240c39906b042615a55da86d77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70114b443b13493adf6cbd2a5feb20353a020d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5e146ea251c2ec99cb0a8ac720b19bd378db2b7a4e9937ba6fb03318de5e16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecc302765bf8ec720b57f51ce8558f6b643ccd87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87215968e8502ed1d6d875fb518b45cb81288a696d4f2a338405da5b59466da9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50bd2bfc6d91c8df3b7fa41c7fa07755fb272e8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817af95e54435626068e002c07a36e203084861cd2cde7f5ba06a982b1255ada +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e86d3edd66216e9ad6f0ac9ac1da6b97ac60957b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0902350fb3d0e68184c0c617b7c431d2185c5b2b591eb34a5b0e24c23a5ede +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d394c647d07c7d647cbc500aca931a582bd5ca3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842aa9fac78276046e5d1d7a719e0783cb4fab468998f46f78ce6585c09889b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fbf297c080e4601e374aea4f31d20feae38d4f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34cfb515b646f84cb65084227b62fa81221614a246cc7bd796967bde3553fbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..558238b4ff9aa7d52d36daee1f340b74d14ce737 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4820213d2fc51f78b7b0b15b0b9479d868b9125150e22d096b6e1c606480556c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3bf45fdd60bbb19d24f40e696a8c1c96cd4f713 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c1d587e8ec8739104ceee684a0e6fb63f0b7b82febfe0fe747828593e2cedfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96a9b35b1198f5fdb7102b72c45da225473d784 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3448f95e3ce86b5c9a8173231de325e2faeff7534e9d462edb2acab30e079a13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0c68f8e899607722108d99ec51b50989e35fb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22c761b2872a0db1aad20e6552150d0995355b25744ce1d13440c6dfa38a4b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..adc1e5e68011ba40f71e6cee6eccc26c010dda9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df74eba54a83ba24ba8ad442b1cb69c489e6a702e24c134f736e6a296aba5cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4137e8d3254e6f797953e651183e577f9fc371 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915927215a32718f9d8d023bbf4ae92e627b97b1a798b800ef5a1eca98db78c1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92de655021ede549983f347c5bc6fb4ddd102830 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087903a2dddd9166f99e25782ef47de28f78099cd05aa894aaf3a5cdaeb6ab80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ae5b4b56d0aa7d69a47e69d6b90ddfea9e35fac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf4c21c83586d10deeb816e585b7b425cc0c1ceaaae4ae6f84ec87a5b2f839c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27bd52ec634f8d82fa9fa2c4af0c0fa3313b137 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a561858ee241283521546fd054db47c70796e3869572cfe5fafdcd3187acab4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a65183d90dfd7f68886bd550ab6c814cd4160c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74c1b607454533cc67a01cac790c3aac5c232dfc394c917ec7209b9eb1014f47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b7f2f24dcc39c14e1adbd86a763aaff813f9af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d471d583c069fe6fb90a1b7a941d886cfa54dd954009cd121dea021b581c8d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8fe785ff35fb84547e106d2044234d6db009d70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aadc0bbb62de0899cb7c8f0a347f0fcbadc85ed15cae916fbe82279dc00b92df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9cc1819832491087783108402d3f0333748a25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a0008a25a13af56e90e4afdb95d40f9b156c8fad9572135da533be584d614f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a093825656f84a88332ae9ad26711f87a35ec200 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7bfad2cf2125f0c539cfbaf897bc9277742d0c48d0cfe4ca9876f8d091d1046 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0666f0f3e8ae79b1c417ea7022feb6a864cec3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:534d0faec5c23c8d6c335bd6ff36886307f6eb84489989d34c3c88919a823bd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ccdb398dce212f265c618306e15d627bb767dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a482f0740a63483a1259046f6788645c87dbd281462272cac24db1e9a007c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df51f2af8badf3decef0ea17e627e59a0e2a9cb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a182430dcc7956a5b8ad3b8c7bd600926d134bdc1716e959238a1596d5ecbfe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41d59ec1f2390ed74ce792d3533220390e75a0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d087fa3a88a66aefa6cf6261f2f50d82eba41627b89232c518672432ab7e9dd2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..870a969b550599fdf3e1fadaee58691d03b8f78c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8026d01eeab606e9e597196e7fa6137bb17d24a504bd3b328240bbfc9fdb9fcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..858b58c4c1e40865d2b84e98d274f85edb4b36fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f054dc672ed46ae8b5b4edfed40a01a01e2e5007f9100406a668db42e4913b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e71ffb83b5edadaeb2e6822a5eaf581a5884061c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383a58cd257c55a7db763fd4ce3fb4829a09bf59f1591926df8af576311c89dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c234369d4f4de81cdf974e0d7a9fd01132ca8d39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd49b20ec4a7763069220eb3f0eb4e786bbb1a272a81d010329a59f0332fccc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..898772c4ff57e1c0809f631e39e4a63e80f5e1b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:008fcccded98865c3098b10805c29ef53aca59ed474c706e7ee63cb1dfca775d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8cd281a20bba96da4909b3f7290cc5d678784e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b369ccb4d737cd668383ae4b32eeabe4a5892a90bf70a531b9cd2bf81a21bb09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cc7809995b50294b2def1d312f1f00f4688adff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b9e6251c5f983f689847e0498a98ef34bf826140a40a0f48e2dfce11e9e6cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c496400eae396c924d89690339aa9b0cf33d239 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feceb4c5365c686da2a85e5ae9e26324872d43c64f1be07b5279a5a330216ba8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb0e6f95e213c70c86d0d3a7cafe75649f60b5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149f817938602543e0b276ea5d223c6dd03c9c33a56f3cf025a7a347cfd2da4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6414b60f10ee3ca72f09312618c63fdc48307823 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d211aa94bf899d6418143300e40c306e8eb74e8325f5c9a37fc03db1aecfe4c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2f9afbccf52c00c0f137d309d9585b6109fea3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beee581a449cc71075909723065fe9d2972fe722566fa2a4bf18749c720e46c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea59fb387bc5898dfb0a49d24ef134dfc1951121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7072f4410601c30221bc0c3e4dbf63963354ba0c2b619e0cf2370e0e8e66e73 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd3615d72416b2b077df1280f9fd30a7c23ec4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba5bd720eb7a975532943e37eca27a0c83133a7e00afaa1ba6a4d032f0d14b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7975031db4d9b84ef446b52908ff2436ecd72c1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088e731062968b16c34d809230d844f6f58dc819a4b3bdd8c239cdd26ecfc001 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb74d1425081f5303737743328a07a1516744ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770cc5f52fea3ed36b81d14970dcb1820049709ec0ac4ed2f85b55c878ad9546 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0a30ba812466c6c4e46f6b63946f38d0abc354 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68536d70c754a6b6f0109f8a3e237e8e00e8abe92556cbdcf3d09934436c3b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..821b238d85453d46b4e31f5823f4751493a92d74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dff32802dda0d748730e897f227e27d4fd8bccd6a838e12163b49e9420e10bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5dd4b57e916765c204c9c4b0f15a7bace553bf7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa574f638c5a7ad68b825229f45baf68527ac53bb67425b3767ce1322b257582 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..389a2a958e9a864ed1d5255047dece803d3f3dc5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4768a8371ae81a565d5fc02e193912348afb79227abeafd22a80ac6ae2013652 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e148b53b0779b5f4252e72e34a4a4ed01dc90356 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab9c03916706dd5d35506680df49ec69a23280e82e93b113856b3a0f5b4a91d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aac630ca8ce6aa1d7e487f6b270acd48415364c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb21b54dd37fdedb945f41e2398f965c4a24ac942def26a871157bca032080a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ed60e1e27f18d95d9649c4e7010b82b8f17353 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8f7addf52fd0f27c38704ab1e4e7628e571501e9ab6e2f831ead4e036a5bf5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d012e1adc9aa9b223c9420dd068fa37d940a8a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11e531b3a514806365ffa138c7f6d4458ddc1a0c891d4f1ec48e01f03808f38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59620ec33379a190576de7d7696593dd7afc0d86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c01dd929dc2e03a5c76118777bc989003626b3c4118c660a2ae9f380ef29bd7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec2358a4afb3b249275b5efdff219b8f68cbb26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c56877aad1d003af64df5790e4595b28e7d4a33e88df64fc3314ca985a8f4e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b63a423e623423cf1f7791b8717e809223f288a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5707f11fbac0a1ad65ee133b412a0fe05b4b4bd25615902f5d0c8f4f315b054f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b945683fb0f49632441cdb35822dd4e39650b4c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62dfb83c8e629ad804a41e06330e285673ddb6aa1d4cb505f79f26e765720818 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57bcd141845a91d01e6a6e10a72311d5837b0b29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350c9c027f378f0868fd09fa2d4f3146a7ac90dc8357556590ae9a913ce13458 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a9e1ab1b2f61768f1f5c5461e768ed5d6ff3ef9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2cf71e1ad82cb44be4dc389cb0e301acbc924a51e455f8784595db6c7faf2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4597f4d833ea7e4d1ec67baf5352ea1a3c1f92cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31bb0c6e0a2b24ac30bb552fb56d5c44a1d24a36181e79f956f098c855aa270 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e501101b7b6527913eb547625d1734c1e7e1b0b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515c33965ad244946c82667c798e2e1659ead493a738054bed26e72d9d588f13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4790756926a1760f61e6edd05e3b66f84603f2cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5569b7c0397d38e29df7b692e2396e49f308cdcd8bd73b7caa568eeb8d9a74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f797645af2f86e73fd78e54c03c4234e7cee9aa1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671807758ec0973d4ee4ddab50915ce888554415b0508594abe2ae15bd5079b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15020cd3c8a88ad56e3467244b48b1e47a6e7a1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a44f60031151710fb60364cc67d6bafbd99b84063717922ade97ff43ad1f814 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a65d017a805e65c9351ea83b6009544b1119c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc74003721740c83bf8269196dc7ebfd72f615c76ef4468eb7ae117c81fa7b3 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdfb3703dc496d6b2b2bca7dce8a343e483520d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c3ed7991c7ae30419ba06485503e6de74d567bd9ed00091c0d50ff8dc2cbcab +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09416e5643f65ac249870ae274d376b2bf2f7dca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a3504d8957eb96d1d74888112ff8884ee67ef7827f6ab37ff17fb89ba1970b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01fe0972178c854989897ce3c3a27fef426e3cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2aa28b02badd6a42af98bbc2efa8e33d1c336258acff8e0eb1bb42d1a5f262 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e0d46654c87ec66ae36b897474ba55238662ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb2553e4a199fc3611bf6feaa64fe0b2a19d67db44a63642ead08ad64a54452e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3ff9ce83411ac27cfbb3aaafea83bf18ade1a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be3ba7be9591a37ea5b92be1eab4007ebdaeefd87d97937ea3fa840e2a32f27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a25b86f525e14ce2fa4227ba674471a88820dda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcabcd15f470003780f590b6377438b6a98b5b8dbc1df1d3e8bd7b8bb0428aeb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dacbc3fb7bafcebf3eecad83e86ac909f541bf60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42acc35312d0d351dfaff54b9b4787b707757b8595845d6d4faea01d3d83dc8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60b6fb2fd561b6652082b1a37d748c619e2a86de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19d8a3d266e7000708146c5dbc02c33b067d88d876b5c62280a7e966eefe84a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d0c1f9bee6b32a2a108a667896be20154a95cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330a1b16370a34901b939f8ffa8204d6a2d91e3489d143d16db05a462ccd468e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f0c5d91cb9bb7db58247190a03ae873350540a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d5514fb254194968e2f1f5999fdb3fdb03119b06a44e2de7878c36b230f7f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32be6efa82d5e2f5029b4a08104c805648b47047 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e4eeab0ac128d2560c8b2ce910d58905127f55a75a716069e7c20b030fba807 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..042b715c70afbf599aa21495f48d805d9404e620 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb970f8e1adcc2ec9e4307fccb329ebb328aa3d18e5290c3c17eb4757f6060cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb9bc2867868ccf3f5099f8289b0df700ee5011f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f79423aaf03cb633f4c0a17f5ce0ac85339d72b7de9e7058edb22178843111e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0c20345fc9cc9051d15422509515c35209bb71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c3ce1526b7d822995f40ddc11cdc51ba6007c8ad10876f5db5c742678f096c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0213a012ddb417ea94bd0b9e8a56b2748dc344 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d86cbbbf9db040d79c2952c404ad60245ade664d749c44de1b8f1d8c42b67ab +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51ed9c59a7a4120bb0e9c4ccf96145d573bb0c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6199b1b0639c5a0813c050314ff0a1bc5e3a1c2553df1799002138078904bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64dc94203e015a24859bc1ccd5cb725e9f1fe814 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc035e257d000f69d88c5baad4c475a215f82723921edfc21e5c4c57bea261f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..930fe7d5dd1ab9fbe6f33bab20ad44590bfba4d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6733dbacf04a034637ab175d1d0ad89ca3cdcd0b9fdeadd6d5f22204cf34d2d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85ac3284f1e60caa4d0af716d695491fae6000d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af61c459935c96b016ccff850323914ca3f51bb25f1dc92f3737f93232f1c5c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd1420fc1fa2aa3c2d985b9773b7b9407163e1ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c070f9952a18fb1c8dc04b0fc89c16d8a6bcdedad16ec4325cb5fdc59871681c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12fb5bba66c445e116db97cbfcae9efe64c6aec4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96eef2057f27e088acf7fe725fb7d189a59f254c134c6c9cf0ddb5008e842324 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dcd29aa9a4d1778f85c9cbe81d18812916b162d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1456479441ccd246bdf4aef5c7aefcf42ecb6f87ed5c615585daa9f00ff096 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d0cd73043f2d45514e12ffbc967873822d06059 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b24a890affcafb687446e1db41fc67c1f176aac91f1168548024062640964b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de149e4d927b1d7b8adc00ee7f60ac49a529878e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02099bd14cb4cd7976c88dd33f5c4a350047f70f35c3b6ec8da2615c356219ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66157d2ae947c97f5cda5588f9b67885d0b3031d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3481a0f60360b045c7c6db5793cb47adba452e91686abc48dd2e7e1e445cf525 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5287d7cba08d4b1af7e7a726b90229a8f414ab7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316e94ab1ba4425964e6df7dedf14d056d7cb7c8a15d235f639621e5ca677e50 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be958c2884d0c67897cb8f7827104cfc07721cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c5b61fa791fea472ec094033d39d97cb1c74190f76bd53c52cd01ac8c07147 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f026eb64ba59cbf7394d83a8b71cd9207f97932 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4051d67b6b784de969a25cff0769c71072178adff91e12fdd5f8e5e8044b0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c8f2738260efa2b02a755dcb862ea64ac2363db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1ee74c4f3058ad6ff04b43fd497fd4dbf35bd7d29a4e68a754c23f7f7930f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14eb47bedff84f46cd6fed4e0ce81a6cc921daf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15645de982f52805a46e11ea5053ba4e37eb5d5e2e7daa55265b1a8b437f513 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c78443dfd3c422e02ae6f2ed8fcc42273174473f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d827fe24cd2a354ada2088f9d3cf7e1f2944145608f61688060954482ab6405d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bcfbc049de79f780163e947f5214835f192099d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76a8f0be7c97f9c51682454e5e898d093b4dad7d3d246662bfb761fe74ca69ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c36db2363efb39fbd7d911f6324023220372ee1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b515af27df2d6559e19c2cf82187db1b6871b78eadea882dfbe5d337eda5aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72d5f9364209a88e0485bd8c1fa88862c68309d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635b973f722b9bb87bbb813a06e0e023e74ab2af7210c06615371668d476d540 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5934d943da46224e1925cd64549413fb96ede7be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4ef9cfea33b43a23e08aeb6d14f782245ee185fe00b4bae7a401e28a45dc20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b41fabc0b8fd7801e3a5f2d1811cddba703b44bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7536328fd8a4573cb498d5c869f129f2c8025d22a2d767e5e48e80ff1652afe0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d2b3e405f311844f534ff0a18576b773646a0a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db5b1d4bcfc696665ebdc9ecf596f4973752001bdf5eb864129178bba9fef5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8f669ced4d90836232d57a5f422c3a67db4203 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b978718106b01a660b45896f689d2002291f7ea9ce83d374e8a2a0662a37f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ad28ca2e4bb061355b19c90ac3e0d5942f0c1ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529b87f891ce144c834a0c98d1cf018b1f75733158774b915c21b6f7bb9864f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a71eec3dbde4488a188ceb758467a2e2bd501e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533928dadab6171e6ddca2c615728e7fcab4c1484005adf3f63caa64f0266776 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1ae42cb00f297bdcfc690f37adaf715aaabdc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8065611fb5594f867577aa6a7200a96a5fa0b85f24f9af01cbf33602751587 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc17a1a35887bd387d7d8e8b9284442398ae886 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5785508667a0217b4eba543cad140c158f57a168d00f7e2f5eb9a0c189ced944 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c30e7d1af14545a07f3500d1ce1604cb867fa9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6cbdb29e8081f239cab6328f7c6accf8c1488d31f356be47bf0eac021ba599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d60811228ae0fa80180773ff7bad9fac32ba2da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad79fa623848867a41903e52d427fc0e5d304bbe80f17bd71c7e1ed9d4ead15e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..515145c8c70a96f455d7a495e3bb17032671f2fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a48a0fbec9d67037f8f6cb6177d307f313976cc952917495495b2113786676 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c25116398d7455236aa841d9ff7ab966f3ad2c8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f543e24cdfc87e3de3fbb46f9386f8e6795899339930d88be00e1fd1c4589054 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d176164d5e8627ddfb031498ed72d8ebcf661547 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e601e8c3cec7f8998b87a4054f9081c543f6ee37786dfb18cc71afcc5d964b6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38dc65a410671246a3b77c166466cbe4a7cfd686 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b132694e36fad3950ab47800f3db1d871f24c7eec6e0081ac343d71fc5280455 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3679126b4170b4622759b5a7637cfd68a2d07e90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84a91239967e4191c3a0f9b1e32f79427b7fc2acbc06631887293bd31cae095 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70600475bae36d0d2df823677e751a3508282039 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16712a5fb561cc741ac9c414f5e56af43da15f22c83bd8e074984481095f6cb2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ef939e5ba39ccad47c775515dbf2321cdb0510 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f83b56564495c7de2d5e019d0a2b406b2f131b0fa85b011ec9f564ee2f0304 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..342019e95090c790a54dcee32a41f94681fb74f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78069189462d6a8f695f2fc8b7b0328e50d14a47f066d1fb41da8fc8b772a1bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44413d0d271887087c93ed5c5ca9a4dc22e45c8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f9d0c77f66ace40692791b0760fddad9103ac930236664e766713ac14e1eb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6025a0caf8dcad2c67f1a9aefb2b44421e9233e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194d936478e77f24d1c54f93d7bffe89eadc10a1efa137eae295617d69d74f4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84170cd3b0883bf422da30833601baa821a6f8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:831f93ce7b53b909cc0e103924e8e6ce8e653b547d66db62361dcf92301deeb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b21585eb104d55cf357a0b9828cec9b63d7d3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfc50284c87acc232754b08b6740d38b4a09edcd90460a78b36174a2a9473617 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5837af9ba590b7fefd1d139459e861dc7134b024 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44876a84e1f4c03eaf04d827a0f20830a720ac423fe65600065275666a86f0af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e09a0750e5b391e0c406fcde94522c00a7729a5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebe083e39a8b382b4269e8d4d86d1aa44e3dc73f00b30fe50d49549dcf1a00e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7439881405329aedc5ed3dd9c8b4b7e37c51ef4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e6957f3f577d0d2dc5714e0222ba777f316ef4f8fc95bdce4f8856afad4051b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..577216d5180815391e11fa5e2e62c7b752166da8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baed94309ed239c8e4907eee7164c90f73c52781bebb1e754124c64620cea4f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc60e990be2e20d06b13e25a6d31568ab0273e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39f1a27f1f0221e0e60a3f6a92cfd6de917c9ea382d98e57d07cc25b8a267d2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a5ecf3ed1cb7a12883822154b5b780652d34c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5d3d8903d186bc892268044999a38117b43e7b363cf41af9b91aa1d526030b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab37ee9890aaf11e0e3448f29cb03764f9290e71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f316da8bfbaa6125bd579576f208355eff949da14a6f6a0f3f39c33d53c1f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ca1a6a00ff70450748bb73bb93aa13decaa12d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81cfd34d6fff5b581fb977cc41a8f23277d06a76d9341a4fc8360658d96711b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc65db324ec78c77a1ba8b1a5842998baf7c9125 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3754e9a562ebc38defae1ee25534490c2ed300ce04970d925db37217e2e9eb16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1daa0b5d836271f6767db94c949549db3dfbf5d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e5631f1bfc8f6391cd389f9c584aa9ef95760613177da93ebf4bca3ee37e90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b8785435847001e0d357ed9f881f39da931f00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1b87597bf677dd84d5ff76948ab90ced7945db01af1b09092c9c36d711370c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53764993c9cc5394178c99a529fc1517cdc15cc1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c287c5e7c393a863cfaff7a54d5a86fcddb53c1bf368cb8d3b51ec1b9c58e9a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c42d0b36f8f023edf88f5256bc98e44adbbfb96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18aed3196958690831fe0ceae19e2cc18831f6edbcb24900d25e3fc1ac2f6ec9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fbc07d76461c8f5aaadf2cef70bdc375f77ff1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3c847ec476ea90e8250a32b3cac16222412576215272d885f1ae07cfa3fa37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6010494cdc146a7899add7395563b799a0a785d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42a49256ba51269690cb7d926f901428167082df8848d44d0d9f2d445644bcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b5011c380683e4d0359383c51b24fbdc660121a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a33861f5f34e7bca7c40f558e48ea063212d2948d8573234a63a3b79c536fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..257ae8ac316604722676115c0e570907254eef0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75dc0e6b8264f8e8e07d2892a6599a1522b01c27db362d9bdcfacaddc3db0c71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7085decb5d9298f2f830fcc7b6e721bc5e7e6db5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0214e83282e39724e6c77716e85940de9b2080c2ca750e44d46e0094c2fde6d1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb3414ef5ed7d5b6af38460125a6c3afaee75fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86768ab5493c05b93f8922fbd581853e5cbae6df65d39433c3931daecc2fbc7d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de2db0e46a751ad30c530af06e87eaaa0e276fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28d9d13eec02d4cdc2daf2313ec8ea9151a690ce4d7e492aca6c5f46e592323 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c105e8d02627887e8dcf941b35893a74e2afffae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d40391d8d1e4f9bdd2ebc6754ccae799696e1324fe17aa9550b076bb8a70919 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f6c51491ba700dd7ca43d2199951a4ca8460bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd99c81c75a759c5390748ff8127aadfcf7141da45a6877a144b07fae0461e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85911afc4f48947f4813b578a7977d8e19945d65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d587339d0a368d963ed73047562a26432a1a6cf0a1b14efd64b9307386390921 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5afb53fba195572b09fcb70ef1b9de26f11174 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6f0ac151914adddfcb32059e23c29cad53be4a2425bcd909956f7f08f0ee38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef158922e4f4600f70a7c416499951831d1755b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218b84316f06d46d3e74229d01d1592af203507999bd01e02e7e4349976f4ac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a1ca8fb449c45c1e15c447a783c7d3521a94aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ced47ee5c52e068ea6b5100cba0969682abfb597076e4aa994da5f5f7b885e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83eef4939a96f57ee7f1be45e282a16dfb5d4982 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16e7fc73ac587bd816e9aa7cac9431c4da1a66429251a6e1f6a756b5c8fdb7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4858bf48140f6a3b557a352666ad83bd095536b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc73e8a2e60ec508555cb398719a57d3b100c33a8b461bea1c603920e68b1c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79ba65065cb6d604b5eb4ae5d103cd7716940201 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039e14027573ec6d90254c470824f0656b44c6f0735aa7bfcffb8524bf11864d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08691aaa1d7b5cf34bc4a47aa07ec7f0a2a6afe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24860b8ef551bbfe36860919a553c0f6ff12128ac8cf6ea72514915264e23d12 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b9e5f19dcdd51bf161a92d608961eb762940b93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd9b6a304f2b86f7c6827e7b049bb3e6b47119689f3db940a0220d4e22723c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16abefd770d240b0ce1361c3fd3157df1dd9a72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e4f7bf17abebae3e5cf2d03e41bb34c84d331066540a96d43afd444ddb6385 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b4ee43cc9514ca9d93e782b373a4aef238c0b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889643ec7b7c92ea6b5a88c7e71c15063f5799ca0c7ba450c061a82a7d99d3f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e50a235cd1e98c0df8b773c942c87fd8d3a8822a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02beceaab8966adfb3450d721904f726eeb74c425543715397c489f8c87c8a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27dd1b6af6549668c4030d8da43f424d3e784459 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92feb9a9fb9e2e0a3e5bff6e2b378de3d4ed20d7b6392ced3edaeade5b4b05d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56398eed16a129d9957582945763758e27b04026 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ab11ec4c3e562ceac2f1c23548b97c4b9d3d29a7c488c2988dd45bacf23798 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1927bcff6202879509ddddafaf9c357a478863b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666dec29d0ca7419b3c7660338abf0a7191059701cddf0e9e3225e40680f8108 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eddb748525b25d43675bb5994da0f9e478c84e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abf39e94432d729e188edd6b69bb777063731eba7624f6c846885375fc6cf1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54acade03f0511080eba154f101e25108a6cbbfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973b0cdaf7e67ee02beac9e099fef4dceced65e74591196fde23b8798a92694a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0267e1f7cadd36c336a6a8656d58d2050f7f13d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402a3fa75e4514d38337364cdc3eec3005dab784418ec262f0cd091ca97ed420 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89a7b5df4f9ecd3a78e9ca81becb2c755e252ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83506c5f8cd52ac96aee267adaa633c0167693987ba7b411ff393ae95590d60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b35c2bd4b0a7b7ad0dfcf1128c53f033414ece5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29eb8293548f82ef19387265fb7532d8004b240cd26e239cdf4733e97ebd7244 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..767ff70a47c66b301c00ae4cb9741662b3f87740 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928136b6a4336c8177cc202f8b13fc565f55ef999baea7203a484ba0a12e77db +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d9a99c3c013f3142229d4a53da0e490bec93cee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e80cb1071f05857d016504047bdb281f0cf9cf0060839f224b759d047ac0649 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9e60e23508965805b49807840fd52e01c8ecd2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f50a3018c99dfd635838ff0fa4d67cc3cdf88f94750c41f45f5c911a1dbfda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3712ca015fb68c940180f8f42b58bb4d76d9d285 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5fec268eaa4165c7471024a88decc266e40ea5ce80f77b6f26a307aa36f4c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d38c9d08f9bcd7496952d1306d4f7f37235d0b8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f27c600b8c65a85dfaaa22c08e8291e5806dee1276d210ddcd2a0c7cb4a1a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..797a4d063f5bd83e7e82bc8a90fa7a5d0a9c51f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d85e5e9c80c04db6f5ea1261735de7de6897bf64149821a1cd7834fff62ca5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..289e0446b64d4c144b0fd71a147b2933b970521f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a3abd26bbeb587807772b6ee29de4a01771e3381e173b1670f5e61a2a9f44e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b428d338652cc4f76f803f534b1ec52404b8f6d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9cdbd532fe06be9a4b36d1259ee06f65958423ecd301c3dcd999805790cc3a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6a49bcc965dee54e0b4921343679a57c2b346f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f9c5fee67405dcbce9a68cde2b94b7e3feb4ff83deadb03d69fbcd43c31746 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48dd69154c0f23ff9c90f1cbc2c1cedf629d396b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73791a536b622b0fd4e7640140327d4902d991225498b7ca5283e3dc30b635b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..845c57dda1b2fd4aea44316479399f153e2e6316 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d2b2c17e1f3d34e4858fb07762ca91ee717df55a5e745ae060bfb899e8cf90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72cbad2e0dcbee95a4f3b3ca6afbc8270145793d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8e0df69e175783d3abea17428ca1113227d1c39897c77b1e196b71b63d10d9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e8a86561aa6a7d061d698ed2ee2e39096a28a0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ca8ddd7af5e92241349d9c2131f5680f366609b11e13b04e5f74301586f311 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d2fbd033b32ff2e232ebd77f8507cb0b3a4857 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d89fdaf70764babde3d288d9e3caef0acaf664ee156e7daadd9a65bf40c03e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4543e07299b068f92424b7dd7f72f21730b9d677 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8acb53771724331e37fd10a1bba3f8b144dcc97a974d0eea406e0b6a28823c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1499003e832b29ea69a4361eee9b35f1a3d6f203 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6503a56706d99fd99a6a96503728c86e10a51de80773faa3dd3f13c154c8734 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55f70330bc8e63c59335c1e8a5921268c7ce73f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abcd1de002bca9e2c459c83b7dbfa6cb48cd8b0bab2fefc112320bb8d3e5587 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9604c9c57c040ad8be2b6f2a6af4072a43f2629b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bde674ceefc5deab586ba9743148283a6920b344d1fa27bd492f20017b72db8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6492e2fc6babb1bb9d6fe16dcd82102cac36e041 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d14c0dfada202faec064dd19112da4a0f3a65c528a9194b3fbe35f34d0331a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c10335cab500a17614b87dfdfd5f0a0a6191ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67103525c2c6661a74683c2c67814fca68c9d72f68d9f999571ae4e169b8522e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db8bdb0f07a5e87e3ef23579f18ed78629ed7adb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5745cbd1b6796678c27f4add391a364147f75691d3588f5cda758ac3abf7cc81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..feeadbdfdd90385537883b2c882c97410dec85af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb9895c6211de3f1f8d3558b3d58bc45b527383413e81bd637045ed52e299db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef92cf80d8727129cb5ef19cd8b30d0c4ba65545 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc95014420f4e1aad4540a278f5125fc56baaca9c8f8d7a981d6e3a2e999488 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeb2e4e29ea252f6f43f32c6c31bbe34fcf446a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80cfd1c121123e56488ea2b580f71dc2f3d7bdcfe7a1ed361365a4db877c129f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d551fc8aaafe06f6906b66976a6cc547dd86c1bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981fec1336584bbe6af46ea14c6f980e37b2e7207aa24bb882751db00ef148c2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17b6f4fbfb51f21ac7324474d503d4e5b8d30666 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf955c3c99b318caf8e8501562e2d903692c38f535459c752e6353fa9401382 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..010103d36f9e7747b62a016388d6a32692e6f3ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5757b0b12db392a967df0e4d4f3136ab73bb1d4ebe8f4e8c0bc5b748e56be4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b984bd7116405c26e0858390c9420b4a3a8f174 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1db3debbb340b0bbff5344529e711b9dc8521a1242844a0ddeea7c347a0e19a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..983d2f4cde1d526c98a39f65040082ef162ca994 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbf17c677301496fd5a309c8f1529fb80814e6fcb4dcfe36a123b0b670dbec6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11463ab6ac393aa70907ffb419c15014c090712f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:776ed8986b2ee26d25725b558162b84ca2554a663bf264d59edaf6d850499c15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae276698ba564f17ccc80fa3b0e1d1d32330681a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97bc95be57550b1d15c0932ff8b2e7fd95e46c52f15dc1f5a422b1b30f018e68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f00ea9129727641b06e225f7482db6686a27dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c32eaa2d01c9619f69b2bc89253acd084b920487bb83d8ae760b924b305f838 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be7900643d6b66fb7d8c27b1bee9fe7a628c8a0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f393b135e8a5403d27f924e01a33337b3599082397f26b85b897d78af465c264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be1d00d4d0a1fd31aeb65346657bfdbeb230cc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e16753b069e87ca1b70b26d880dc8b0ac61c3d5ab9496ffd8798c6251bcc02cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1b2fbdc75e262a1a6bc2a08137efa7af4477731 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5cf7d4bb223d06af1c662064ad0b67b470dcb71d0d210fb668f7c1a130e786 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16b13f8a89b8ec63917a9875bb57fcee9dafd696 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e965af4d501017c1a0a078f9736f1321ef47fd78c0ed6c3f80667c028e04f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89251589f669d1495f920074ca28773785f2041 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e53c291ca197a95f9e90bdbbb6cd7dcf4d4b55efb8e0ea59a3455d9f7c31264 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02662bde13cbe8790d30cb5c743ef8f4420f5607 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5ee536be2119057b37ed2b11544db49ddaf4949ab35071fa7427c86b2535c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb8205a43bbef9719f9a5781edd4698006cccbb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bf75e048078b0a2ed355600fc948bfdb6bc32b1fb3ceb9d33e3c20f264a256 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f7be1d320acadea422b80e21b9f70cc9f7f4eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7ea17a6f248766e47fb26596682d73aa7572f172cd965a76cb6bfc75c7f677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6723a42d19e730219b9a322bc571ce248addc16e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5546f7f183e9522b8baef6b993f0ad9a769620e9bc19a45231238024a2c9e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e83cebcd6c734ef8289e8fad88573664a1bfd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f377d154e0c540137fea3652a379e3ff096922c3f67830035814132a2e2ca4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7de607bb6a8da15b8cc3e3f048539fe29ac4f5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d441a7dc53d2cc07019baec0a54814ac6b8ff9442e72d54432dc271587dd7dc6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a27cc9ea71014359e744bb5353d23b77920b59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18dcba6527c44db1f1c72e698395e5506a50777c69e75e499d050f2b6a17da5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..821fb235f4676f6bc2d4440ba9b6f23c878f14db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d4001f2cde691b7cb0722f25046723a49896019455b65948cd8ab340ec1f42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aae059849caebc5fb91e5d3bef93f18144eb457 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02132fe774b946cda144115d716035384a72b7a2ede65ba6b8011b4398f00c5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b7f2f063014516f6849af08c6b3018db64b0ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5435ea081f64d0a9fe42b4242207c98317c6158100230248ac6b96a44efb167c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5051b196c898057087804220c298ec660b1180b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6510a1c8a7f71255bd9dae03f28eb19139ef5e12b0bd7d615130859caa9aa8b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f3d93f5a57000e3c1a46c0791705f31127bb73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76848540e977808c05f6077c1f5e569f21f0cf0f44c6bfc280adf9edb0bf377f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe763d7cbcb09e39a0ec49d96daa91a9ea815a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bcefb13426357799e21b23fc20f506b4a55f225a523aefc6dc030724df8f8ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc8b2557e4eecb7104c5c1a778d2fb8b7abb2b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6283fd88bc19797ac148c17239e8ddb0f93b6c7237be2be39003fbd1ab2671 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e53c9eddb47ecbc3205e4209842b336dfeade4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57fdea5fc495dad107a824422261b6c2013cc944c64d7759a11085e9aba96618 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e57f5836c0e2265688c0d117a21acb95f426d30c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3987f3d99ba781b1e926c80bae5b864ceb54d608a7b261bee6256f9076497a06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7097218fd4835f581bf0245f2f4db23a781e79b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a20d4203ef61213137f9ee2ec2104f7b99344cebed5372dab425c959c96281f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa8d7d9c23bf2d436ad8261209b3686d60cddb0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf60be9762c69b8c8c86d5a76918a9c42cf55b9e1201defcfce06adec82d651 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8e774ffec72a289c9584bd201d498157d60712 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32636385b773e83c319b5edc92b42738431db656cea5463b1269177815b652d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b6636e968846be44bde4603a95a105bad6cd692 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470c6386159d2a449b8ce405820d8892bb82ba478a0449b5f3dda67f617ba9a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5842ea3483918ed46425548854c45dc4af898c42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255abb33573a1ed66afbe3fcb63710a395fdcd32bffa4293065ea4c083d90ac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..317ac34ff353b67734360c04ae75ac101c762168 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06522c47a7c22805bc9b191b5790e85c06511a85c42c73eb450882427bb2e6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1caa8299fe40eb37556060989666eb59901332d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa6336149a8fe2a06f27994343fd8feaeeea53dd4cf1cd30f190d91460a1b9f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..936575e0670c84c7aa221b1504c923f8c9b2aaed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36c0ce85fece785a7e881c53684d5825e161bb3e1cec71abcd59d7aad275286 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5f1b767e32ccd436c5580ecc0ecceb605b11f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697163d4bf5de73789640d0b7efbfd01e63c8efad4000e59d29a8be6a9fd1075 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e9c59c9d385ea76e81fea25795e7a4f251756e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63132f0baec28c9c38f48ee4c391a7f3fbe6f04d9ec3b92dbfae177e91018358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b56e2cd7b7e3bb5f16a2909b474ab3303b8ddd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e5e23388d052a10e11879bab4d06a6ecf8905fd10bea602ef9616c7a47d93ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a05f297c5626007ae1c903cbae7d91681bcf1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde29fc8231e05c044ae6ebed111c7948bb6081eeb4b25738b93455a3b3c1b24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6746a69cb866589cd0d565fc0f344e619408f3a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f760cb357ca4bba8c92bc1b3965fc968676a9b10f6dbbbbe5b77ee64378b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a40bc4cd3fb5b0dc3bc4e74fc1a923082c22b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb03ba02a2f87a50cc2ebe7d01cfe2c34783a8765c8cceb000b00e8d7710cfd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0245996553f64df5938a8bcb04abd85ba9b82f42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b914108ac81b02cad2512d880bc9e68d823c735bf6a1d769a32d72070a4b378a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbb6b445b5ccd249bc36814274401b6519e9ee4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e60b5b3c3e50148313164fece1d05e3b4beba2b198f18b5b623d7912a0434c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45a19b3dfd77e10611fbc14bfe04c6d32910bb52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887b1a53c6a47f23abdd7e572113d5a72347e6fcbc41a74862c15dd05799bd89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..266790149e19aadd68ead0355347821a6eb9b0ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9fbcba6e0b3a4db4f9edbab737dfe15feb702009a1fe4ba65d0db3ceb47f18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d1d3a8adcd5f570d6da38a708f897ed728d708 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2274913e9ebc6d7348ec1bbb9674f9c14b7112f88bccd400a144b9892ccdf010 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c909b8203dc44564d3d0b3393f4227e9c13e845b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d9931ca4b7865516cacf76f07864b21027bb9d38b0911e0671e39499304375 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b549c9c7058e61b67b60d485efcac02f044835 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7b4803a890eb5581483f91f3b7e12e608078146ed8c0887dcad1b9b5fc4e88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..730f08f1bf7c8d3e4c73783eca444c8e39875c7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0150b8ab4c9b322c8342f774f0116265a1b4adedf88844fe150f52085d96a864 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e900bedaf7f0bc4e6653b9137643e5a833f4659 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124472b6e678c2be56714ae0f69e2a9a3c8938b0f9797c06b86aa7d7117b36d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba297347614a05b7fed73a7d93e975aecae09d59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d989ec5ac8e6f9ca39e74032db8a937fb49bf00e3e029fc6e99f2f46cb1dbd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4533e1ac551f2ad8bf12c27e5e9f162f813a7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b79b6c65cce87f89c495ac46e26cbdf56b005c1127def50ea887bd39cf1f7cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed298f6ae2bb5b3f869b08f019b52c89c038716 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265316bcd1eaf045f57d6a17823a61de4da04750d3dc0f4716505517fee770d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf3a13b8fb866e6c62a55076c9715f217ec4a74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0fbc7a8eb5f2c82d44711b0b2e8ebfbeb90ece95ebce287d3015e8015b2689 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2528d073f713a9dd651e6dafa32b6610c3b4adb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e784f861187cc841558a2cb45e72af3a8ffd2fac86037d28b63995f7e72a86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab18057a21f14b3d7bed11abf12e7e9840fdb7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b3f5b90f745dd10ec840346640090ba6705ff3a20a0382c014053e28e1ef50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0074fe13f1749909c1a5df04acffd93bd020b282 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c2d370d9ba65e3f34c1955729c920172ee87980ae0767d4ee5b0de6e72432a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb75d89124badc2089891ab7a34a23672a3ad0a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141d5031e41b66454096a2ce3cc40c8f7e49a67c422ccda18ab120599b11588f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9034ad384009e58d0004af18f96c129d107f5d75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be59b4e60a6559691cdcc5bf134191ecbfd172370b4038e4e5aa57db79fe19a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..896c74497134dc4c6cce0bb296d09fc971ee2ec6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48596e0df9e517707da86edcec7d7b7cf23ada07d81fbeca2bde5b313f51761a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3fcd4f4c0de8bf312fa6bf507a8ae30507c856d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f098f9941b9ce4a3ce39ef3b2f3130613848cc7e73f6847383b64beed8a31ea1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae9ff5ad725105d8f17767c68f2aeff2f4eaf846 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6982ca69c22bdc81227dbd2d62f9f3e298c1aff5c9b750c7d5558bc837960fbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..541f856f49773f91c7f1305fdb609aa6d125f870 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bac750c0591115756ed17bcccd854182079f5369e654d28a39a5f7adf2c2bd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0f1085cdc97a55f411426a04614c8282eec8d44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421720f46fef13cc5731d2883809eb795845e3156b64d7e4e31131188774538d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6acfce4e5b4806608e4ba188a5cb77dd3edd540 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2243e70204c8720b1987576c23c4962e9db05f8c0879da6e6f5b98324296706 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e1f440d56e4e0f2f59e33ae365e69487651d8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2798ff73cf33b278f0f9791b6ef6be12fd30a062b821e7e33aa9e269ee31d17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9d2d24e223d06e856d35c376b43bbd283f0742 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e03bc9e71377833b5c1f0a39f3c92c96561a03527dbcb8fbfd5c35e602b90c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c56605d743d1bd521adcd9c9225a0a9d72903e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42580cf77929fc2a9db600cc42404ca6df74299be9385c44129ba9a4afe377ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2ff39192fc171d558d60227a66b1eed8604939 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9357b433b2d846ecb6c307b999b614a36f1d4f157021170f1c210ebe77716ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5179f00d1689274e61a6ef59d9c361fef68a6b21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d111557929f783128809174220252e8b8fa04c44a436e2e6d2884c7314316e62 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64bc1695d72bb5b78cddcc2da2204a352e8fe74f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d219dfe87dbfb5adacf8887ebbdc0926132faff5bc4beee24d3d33edeff1659 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4216dbbd3d551be97aac5921355e7991c48a7694 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70655e1fcd978d281a483327f605315725b54e282c974c50c144595fbb695dbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29828a09b5c54ee4f864c318b8c8436b9dbb109a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a892c3ff4a3959def42ed866a11d9ed75bc79df60e9f5ae44cf5b9ac41a0354a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aace41641683ad3076e348f7b770936713f0dea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6d2e3c49c154fa1e5ecda7cbbebb1ce03046dd93e5b9abd733b93b3c05dbff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c939947ca5f5d725686186ff87d54ae36487dc40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e593e452080fbc9505982a71c6dcf00874a889a47bdf40f5b8bff25d75b6c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78f029bfeb814a3c386a35e3f4b6886113a1a35c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc66794613d0755f863ca0f871d0ff957b4257933abcf1c214e5b158cfd595d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..868ce6bc20ff398cc4a1467381f1ef529b35ff8f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d360df713ebc6b168fc945c4b592e1522a2e9a996f4ee572f66d4edf75ad2c43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47780086213fa156388922f6689f38a7ba9586f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7814fa584313c9689aae254f2b9dc102cb88c6726d65fd628af2e716785180b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16aea567d1592277a5eac283231298862d4b228c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8c5e51a0bf4ff08007e0c153f4c7a4a655fc9979a8e79780683ef66fa3024b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07793c0d2b68c8dd8c7319181fb2436501d47cfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c0c0571dc0c49b587d8fb5f8b951ab54522590302e9b6899da2d48469b7c12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b14f89bd50d5cbbda0b8b93f9e165c4a70f634f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:410a442f3bf98d5ce722468a4925616302904f3f649e9c3d615e3c7a23125ba8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd75cb3c2673d2bec3c6c6210aac85ae3a205d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c494b70bfe957d08167b292028bcebac1c1aa24738f99d3f631146249576d5e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87dbd563b1088a0ea35b8944da38b9348b787ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711629b4cda2de67bcecbf4bce7da26fdea68e56f7ecf4e83781c8d63096f620 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1862b9924bb04a05abc03bc2a05b0053d76d856b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3eeeacf9e0dc4ab0c25625d1d2a9390fd5375bd77b8ed22eeff19bfdc66aa00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0bb8daab955a45cd88dadef88c7569325261b39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e8e472499786d779d85658723ddc80193b00a20dd5b7d1dabfde1f456c26a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7254d5f572fbc5e0a58b3760f08886f4ce72adf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d739f79ef1509960a87b8078d955dfd2b751d624bb3058de6814c817298c30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3974fddc02cb41a13b3d1678ed4553d31ae75bd0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e8a89e759b14e415fadcadb4f52e32ee6cb8e4d02e909b733c4d0af35a8ffe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8525616a23870f9da65d59e20b4b8c5dedd28218 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513584ae6306bba4ff7502b6df5dbdb0ae4635a51aba35474b8032a36799101e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3c94320d819e8e73298fad6a2473099503c2b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8620aa638da26c69817e9ad5f121c53c8faa59fb5a3615542aab6567af89c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1913c07feeb214112f176634a54466d6f2194088 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dd623c7319789bb7d8cd8e8ed4e98bd93e07ef8085f33c3bb59487f64b3fd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f77282e69054846f39ac19a162939286a019c8fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932b04bd81b53c6ba74fef3a77464570906f3d53d7012b64d53991715c061b4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19685980332311ac9296cdae338ced001ed11132 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee583f886059e50ed3881959709553693ad7e236f14bc83bdbb2e77f12fbed4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d1aaf2cf0b3e1eeff19f443160e4fdfe5d53d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc0edde20294109bb8596358dde19b4e15b1147421e89017f41fb0be00af0a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd3e53e9d2c69871ea5fa539eac71d6b533c7fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98a00e9c661595143f8abd6412a4c204301b3519ecf5e3e46a8eda51e5357912 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87066a7d5f72be491a6c8ec2006d35118f5c025f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079bd69f8c5767f59e58034824de54473a05eb2ea69767d59fc0be10380b2b8d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4774077cfbe8b25b9a8c046fe786cdd641fca42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27dac2e386db12d2dc273ce368e46138a2c86581391673b6aa549f8f68d3b491 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d507fc9c4693a4b1bc8b85dc5dae07f90735844 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765985814285308479e79a83708d588c95ccc4e8090d92b849f0fb52c188556a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..696f86c72d6171f04bd5b4a9bbd923ca85898a60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0cfe731bc339d970d324fc1017a67e8dec2f857fe18ab54982a3ec57b277682 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c81ba219861dac5ff1d8ec4efc116f47a8800a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a76b49ae95b5a931ebbd6d1bdebbac56e59914743305b90f797770702af1ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c43a2521d92d37cc11d3bc6cdca86bcc76db774 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c80333e81f5b0518fa2a86e68f8cb6241263efab79ea442de44272d2a28e13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14eb172069deda886b37544a36deb311bbcab446 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06efcdd9ab399ceb116b56270632bf7022deadb8742b6ae364df59f895bec8af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c99f2a1e3e1b9be0167c0252aa4dee6e2f4b805 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd66062c992ba83dbcdddcde696f31d888401645cc900a9785cc40f18665a18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e256f4bf82410e58e2489c1938d2cbc9432cb21d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c094ee7ed90d9bd4918c57abfb943694aedc5e6ceb08bf017bc97fd419eab75 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23b237d2ae6340de9d94110e4723f0703e846d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6b77d2e479209921861017ed3e6a1fbfef4e8b396778fb582587ce8e1389b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4193933ca126ba29d951e111826e0cb5157acce4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5552db375c03a0b1d7e3be8c197bf110e2043f37b3b28c6ab03ccd3a4bccfe45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aca5040c76527d5fd054b293df6cc68cfc33069 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99e15a76ca190ba184cd41b389b381941155832755699e97abed7c8dd1b5cd1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44510c8a3c9988025e0eb42ea1f1c31431463160 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f54e216025af098ddacd0d7e8d9aa02bea6f275b71e2f99accae945a752c426 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc50d9bb7eb5840670e2603c213d840bef47c484 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7967626d9bd848cca1aae1cc651eaa5116674f05296d3e10cb43551563aa9a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d462d9571408d54e6d8035bfe59bb644224d77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc0d3186c25454bcb88d9acdb9367d21c28e24f84f8d2b0916a665a9b70b004 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68aaeec0f20f9d39567bc367364f9fb33008ad20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fb174dbfbea626eca15056aed09787f58f4057ce6435001a10e4062fe96d0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e8bb5652ac9ed6d141e7303bcd6de60c3f126 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3b5461d8fca6e1797434ba7a7d27409fb7831706bf38d8cd7e9f4a925229b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab00cae9bcbffa16d07852a799d6fa7dc2fed2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e671ec11cd6d6cafc6a404edaa490a0d7cc6601c4e780ee1e7488fedf471cc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae4fb2347a4889d06fd7a577a3f3ea4a54d387b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4427c2b3111d9986b0dc58c946b0f62e83c36b79e9394ad87ee8560ca2e9eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e94da46bd14a4aa26c3c946b0ab10e551ebb95ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397f059798606a0ef672e86975f26a81ae07834c6c20dc9c77947793b5beb949 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68041dc8da4e0d9bdef63e085eb729f93b5793e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a650c6e854ead764b5bd27df03761468d7656f6f9d665e777276b3ac233878 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92f31f9dc6f2646067c62188ed99b1e02e38a83a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56c4cc61ee5a56b63dd5f8d7cba3ac8e6103bee6c184ed7734ff6084ee738ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34fd2b7be9bbb61ebcdf3a5971b99b8d33c8fbe0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a79815ad0fc9c9feeed0c4651ce959d746e5511149ada8bf51fd7525a61892b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92692fe2cc1c705471ef9d48206f20003b662472 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c2864046f0dabe7c4294618c178c0eb3bb4cfc0d0f5dd8652206ec5d3e4781 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d02a2bcad89c8b2e2eb128364523618acb39c3d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268b90a89331e288f2028aad9c9384abc3a1833242e3adbb4c321e1dbf4747c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d78a1215d8f3c94ba87c7b9a2905164071464a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416e6c7f5ab5ce04d796196aede6884db36ac42c283d4130cd85298f47df68a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e60f7bfae6f5686c7c2ceea31ecd62b309f03b40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e16e66637196af4d91a6298466c055581d7b49fff0cff916b02f04723b2437 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7957fb31c9b844718db068d1046bfefa424f8dd0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ace1975e05ca33cb8cfefa60c7847882fd55bafb272e7c6f94cbee2ff4b7e87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..186068f6b17336f6afb44f1e1ea34ac2caf2e142 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbccdcc6703a520df4da674451b02a8e6ac5aa9e6999d677e3e5ac347326b3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..797806b59dc0e15e5fc0bd6149c829b23cce8607 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c39059294079dc3ecce456625b2923cb49c16c594c702968310523c73cbadb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b57b10dd5f3bb1ff87633e003d1fe8d6ecc2536c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f3f95923440c8a45342c2649d4f975b0466d65ca908a6321efe375e4abe1af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6745f77438d81c16cfde29e5ce9dad9e7624df53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2232bbb7bb2cfefecd95d77ce61c130b1bf9b6905fb0bd6191f331832698ea3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..544bab189e18997319649cbd1af90d27c764b9a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78029a62e970068a382d50934502838633ba22b518fb5f614bc18b3b13f74473 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8a2e4c0ea163c0c6ad94616a5438c18b2268ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd87292f5672685b8ad3e4ecdd23614424d6f5813cf5d61bc3dca087bda0347 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c042040fc36ddd409b1a93ae51bec71589904f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1a258f75dc0f3f024b87ab99dddfb452245a0253bfb879425d3e94aa92ede6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80ed32478eaee66a32671d8c62d91385fb76dabf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bb45d3ad6ec1a3aa5796f350ef1dada9ba9a2ff7e2945045809e27f8a3fe7f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..876232404984472b77994db6caaef0f85b1b3646 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d612e6704e08fdaf56b3f68091e77c0373fcf5af8620462cc105761deae35a39 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..032d09441bf90aaf782704f8f71f7da2ea97fe06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0a6ecfec44100907f761babd80674a43047098eec65aff7cd962eca04b977d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4b2b45fb4017134ec78ceffdaccdedfb89c2bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5d5b9515f1edad0cde8a63f40b295ec79a67547f2dd2b417bec2ad30e6ecc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05777288df8afddb154bcfe63d2c0798feb3dd84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7121c7c8ce1291eabdd109b3cde1f3f4a3be950834c39553617dbb3b90f30242 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5acf02bfa58775b8d6c8e5ed575d556968f28f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3892281a0ce9c788065aa83524a6c3cd72e1261fbdfbffe83ff629e97c6d554 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efc166b82831bb7875c954453c62abd605017e78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582f936e7e06d3161b4ddb9d030d20258d32a08f24e067f0c41f8ebfd6bc8a4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa1f748d8d20102ea889152fca64a114378e17d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3290c477395de8afbf959bc36d3b92373520fd3d1e59823c579f650825a7176d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b7bc965ddf91630bb6e65e855fa8af8137d6b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4780575526cbdadee8c039a6dad8a7850153e4242851eb717540b9d63631ae8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3daf921f386bb6494fcf0585cfefa1b2031e84eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2fbdcb87c5eafb9b5bb39c669be13392d20444f336093da3e77638bbdf11d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..510d0bf8b58ebdbd242d5b6b052d5812c1c2959a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117bc54aa291847a0e3e8b8aa042738bd3ae21bfd52a7cb7d7c9f3f0b2d526d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61be05670adfe82e108e946e0d28f76fc9b174f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbddfed97e18048a2bfbf317ff95d098c4f8d27b92a42e0c8eee3ff08741f84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cca97a8588b543922e158fe0f5408b783831040 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2d73fde87d6fc32b042175f8972c6f5810c1864b75876c92aa3d23696d2d35 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5211d3544d42ad08085ac3584fd10f1eda71035e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1e6f5f62f7486cea3fcd6e9f506f493873f933b8444d1cab60e7b8ea352f3c6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30334c0c03d612af15de763f7d1f17b2b052cb6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4bb5752d5dd9b33232546ba7839cee5e7eb6767e87cde167a10de6c08ec050b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef16f077580a0a68f3fb39ca3e786d650821e885 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11ad5e8d5ef58291aec717aca41d4aeb37dfb165f251472a748b43b3ee24761 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d16f19f9600f4d81015209928fb02c48c220d87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cebcb16c194dd0a6ce318c75eb5dd9b132ef2c771316a61740a7e85d1d9dbb31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05de50421273e5fdf51da5faa075e8d067ac9526 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2253145f313cf76b95a7f4b2502d0c35028121fb05fd5356ff291b65ffd153a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ee6f64cad896ebe3223ce35c7f0bb0c3a58bc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a988334f8fc478b25a3d0f18232a348558b3015790f571494903b7fbab9f4fbb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb71663d5a6f82576cf2e66717bee983ad9d1c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab11fe7611b7cb0a096f76f5dad85251507fbf136d18f07de15d5ef50e59005b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f5877e6eead0f4538782a694cb743f54d3329d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5c1774469fd7ea659db9015b21794f8cbbcb5b33b7d33a111eea9bec431b6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff43d5813ba02bd46c5dd51785aee58ac00fa4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad4ec6c9f1a8b961d7f54f4d67e00095f9e31092ca2227ffd1188dc0a0250a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4025175f9209fdb8f9444289b53b712df775a5a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32363de39e3b463f1f886217cf54de6937b93222895f50f9ae20149ed6200223 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba998d78660eb51cc93d811ae76ebac9835c30dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4d85fdf31b3e1c93a258bf9792eec222b95a47f1d6f2d6856337b0652ce595 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7479c3c32e15731157c4093d6cffdf035d507936 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd342f53e1c4962cc8437e7f448bd2135c197f7433631bc2e9057c10d196a03 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6367a20a9334466dbff3b9de5a9f5284ca68c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0ed031e88db0b98bc07fb11103206707a2353ec092096aa2c6160a03c18873 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..450820c06a3301bafe4d15d3b00e0feea048e629 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af29a25fa12a70719a8b4d45319da8a2a3fbf57bbd5ffc01c20f7a1a3fae10d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdb9e45dbfc71d1fac4d251a52922223238dd09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d501abd18db7f352b7ba35e6d46b4e76f38d2b227dd2c95dec679861200aef5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6f28275edc97627bc33d5ec8c81a55417d9988 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde192c47f169d41bddc7e8e14dc66b3e5841ceceb3f45e828876394676b0aa0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebdad95446fb462f57b8227b194fedb1d5068675 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5985e00e75f6c97fe2e33221e7b1c22c77d247dcc90ed77421291c63e7a6464 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40d7af1b7e464d4d206a315188ac4d6e8bd75260 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7524d1730a0b0dc1b4dfe00639407d922b94ba367c2f72fc19260f75ee80bba6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0ee10bf9ba3fb6bbcd169659736c4444c8685e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5c25ad84b22986af4479bbd9162d2a72fbb4208ff8270a49d8e6429b0b86c5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a30db61ce2b022cf8d820362d18262d8c294f077 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a4877e18fcfa90facb4222101118ccc2627874a59e4222b9b97e9b351a2040 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acd77ed02515034f2f3ee5833591c4b769c6efe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f05e6ed9e2f48dd60ff0e28021857b8c3a1b8e4b0157671d0946cd9436162a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3c2c316f35b210a8a8a6d05141b02e3571ee31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8a940461f4bbed02d8ec293fb730c314985ed20c0ac4c541f6ce47d89a876f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f6e650d946f9fd46d7dafda151b875a0743e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413def10f659f7c377315e2e11c7c781ababe15fce3625764655decb91ad23a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d305012ddfca6d1c68dc3fecc7286dcc42ed41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d033e90c08fe4c6c28ab060050bb048d1c0d5ba78e80807a53dfd72e2a03bd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a19370960a8616e3d6a11418f1ac0ffaea501562 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb4cc4a02a8a81b983c6d11d1a4eff885ab22ff7000c61e1b74ad7f7e9e6031 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa4febf3b35d4f788fb87a4ef183fe91cedd4f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca664a31488652d4a30a9532376c5a5e93077a39d316b1c1153dc98bb636ecf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71f0a1ffa1493eaa9fdd182e9f84e4ad116f619 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fecf51ea5b2368cb1c95d49f2485212e1521d29ce12d35902594b7e394ec7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc036f7ef2e98763605ae886d6256e1167292e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77cbe903941bed4e8ba86e43e5ea5eac83628ec8cd9216619bed3c3eb54fa9f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a455828aba762b1c50f6da05c2d898c798be4e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f816e5cd31c97e8f4b2bc2f1dfa87464c97aa679b464b44bf8dac11580fa62c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..722cb4165e59f554a0c65e132a903977d821ec73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2008e25540a2c9e8593a5763d56b5b1be2b763d2162bd5baaef81b825a609a84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f8397bf84f1e32dae47df0427df3a99511a6c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd22f98075f657943e62cbd44ee4fcb6d4c8d9f8c30a8094435150a1d9e3800 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d1c564fcdebe165846ea48f393c86a3f481c20d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0720271fdda1b2fa7c7f39047945e46e9345631d549e29d4e8ba2518a75ae7e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bcb20ff8982696a9d6d2abd67e02bf8e4a42224 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811b171a2a5b70446723de658d0c404fc02a2fffd06b133f02d14ca63261a5d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b1f482cbe258897464380f00429bddfe801c828 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1c7c7dafbc7a2d9b7c8108fb144f533fbf2ee3889edd0815f2cbb5227ecf76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..565f0cfcd233f18afdd918838b73f141361fe605 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ce991a4e84b7b12abd11e6c72448c14f5349203e967fbedfa257dce12b09a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd922581f92b64a7aa91925681f32173fc48a06f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8ee0ed76dcacef00c7903b86c9686f47ac9954f2c4ab02086fefbdafd65527 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a01278f022811c1dcf313e53184228e0b2881399 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0708c5c3433b2b4d036194c9028acf1fac72b5f7ec08e74078d1eddb20a4ab +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a35f5371bd7b3895596a39e886036eba1c8c651 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1d2ec09eecfac88e280e69fe85300ccb71a13ef63535583ee7231d7fd83cf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7257a37a4dae3abed6ffcd92dd943f4b0bd3501 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22627d83d941a8b0bab567424115b81aba2da17c58b73ee5ba2a86806f19274a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc0794206b003003d9a027790aaac1c567d8300 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0244c798ad453b36a84e07b9acada0f3752840646d4fcb1eaf73e6ce656ef19b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a52d4b499ef4f95705f062224987834d4978c0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38435ec95f7d911b4099b3bb014d7b62e288eb08e7142b052ec7d0c7a2ebc3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5ea029a534a4addba250d1246596017eb302b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c6575246d7ed0d61a62661eba18efa6b289585a6eda0acfc76bb3df1e752e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefa646d873764e06b617564f681ceca4784feee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ea5658ab55155ac59cdc9becfea2ec05bb2cc891e2bff88e927c22df263d3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26ff3b6f06bd31b8b51f64eeaae3d762d30d5e07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4487ff09f69c1b4eba87e88142bfaa674c41eea9f44c2be5dc7d6ac30663c985 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d3079ee0491ea724df18be5aacc4d7336cd2d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10d15547e7befea3c298fcc21e364c455695da23f54ac86afbce59e6d9edcf6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10cb2764d84b1e48b02b672f87dd1530d7989dcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034a1c4ca92c4904695cf7925663bac3c277f4fc26cab3686c34e918f1ed467b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..910e36bcae75f15b364b5da90cee192012f01ad2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35fbae415420266facd4c5397fba1a3269dd4abee7ad9635f522cf950006930 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a95cc6f3c3e38e34e16b3d50d7528155ef92fbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d91eaac57710c454dc5dc5e3c6651852a16acd952f4aa4b984c55e66ef83ac1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c3a37b64bad2577b3ee083977149a24b26f510 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c33b06a15b096b4f3c5ed9172a6932b0ff03c93e830ef0dca945a500262dbb9f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3f4fa58494f81c98d514ce75f6c03e4d977139 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a3e6c1293d939c0b6d9632db4d5d18a9cf5c544fa51e7b332d9c5496216ff5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c855f82f3b2d0af8a1bea79c691c4f27ade7dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2263a9d460b444415776d1e4258a9ac3c54fa9c18d5bc4b9e71a49e4a6e02cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55f2be7a2a7e53f44d81c1143179c985b5f7bd52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a273b608e380523a94c8be954b82822c5b8619193a4b91b839fa50b948b6989 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecb2f947e872036eb973b987e808cea639064ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87af541b482f29c96d1d0a3a3aa37462b777598d56f575a4a587bfca301d24f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3074df8d44ccb53aac9b6ca2733259da8c95df6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4cb7da3ef930ca991b13e9bfae77a0cb02cc8bb3c735ce96e04a373688db36c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0787992bc4cc4e8e8481c0b702b9069ecd10f729 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf7c6193af66ac50978e99af47f4de1af89b7a841510c8e56accdd0b4a41b7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a047e57ca64d156b0f4e1e11a1135a9b41c107 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b858724504338f24839d1867fb96e179576e8e6b86d814d2eac22bf58e0a00d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e8598f305be6c0aa0be9efdb87376fa3d18b8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fccb94c5b494e21eb346e22294405ddb3af68084f385c29cfc97979b850e5f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c425e5e5d96088e04b89e5dd62b0e45c566edeb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b33e88c9f5c79fe49dd5a7aa9cccf0a2c2574391b3c1be354cf3a3c57cfed6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9552f8fcdaead7e921675c5097197be96e875515 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc95f73e4c73cd053672e413df3335d0e483131aa18008df19d89915ad97bb2b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef77b00585db40753d41d074d70c342bff80c9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779296f0c2e8a9d0af87e73acc33b24ab9a0dac87ff592adf68668ba1ca7a49e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7d74762c81eb8195905edc217c593b13c231de2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92fd11fd069736784ba798c4342f2a5c11c41852fc22a2f854f33b13b80b265 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70114b443b13493adf6cbd2a5feb20353a020d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5e146ea251c2ec99cb0a8ac720b19bd378db2b7a4e9937ba6fb03318de5e16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c074f2aae36048fa2d09477ea84fcdd6765082a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317be5507566201358da3922b310f5a70a038b73fd957ee54de32d6db8cbee21 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50bd2bfc6d91c8df3b7fa41c7fa07755fb272e8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817af95e54435626068e002c07a36e203084861cd2cde7f5ba06a982b1255ada +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b14df2948aa27009493642359568f7b9ebfc0c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2ae6aa206634529eb34936202ec4f4bd36ae640f75d955620c3060d0843471 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d394c647d07c7d647cbc500aca931a582bd5ca3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842aa9fac78276046e5d1d7a719e0783cb4fab468998f46f78ce6585c09889b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04afe4f3fa8b98f070db0b87d495339395ea78a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10fd714a66fe45e074fe274b82daab661bc4d44376c9edd7a15fc725428e9e5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..558238b4ff9aa7d52d36daee1f340b74d14ce737 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4820213d2fc51f78b7b0b15b0b9479d868b9125150e22d096b6e1c606480556c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed6fb502fade4b2b33ff0342b4f41d6b671a182 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58dff555e0c7567ee9026ce2b0c8a30e7ea2c8318483cec46a55c3922ade6de2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96a9b35b1198f5fdb7102b72c45da225473d784 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3448f95e3ce86b5c9a8173231de325e2faeff7534e9d462edb2acab30e079a13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e04b9ade4dfd16c4c9c219829b59788a23c21168 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1823320f3716c44a0102a46b46be80daeb7364b3cf940444d14c0a2f3366979b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..adc1e5e68011ba40f71e6cee6eccc26c010dda9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df74eba54a83ba24ba8ad442b1cb69c489e6a702e24c134f736e6a296aba5cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5fc5730e75956549eb57ec204093f3ca3da7f0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb2b305e31648b7e7ce51318a9eab9dc7810f11d603424481e6cdb8739b76393 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92de655021ede549983f347c5bc6fb4ddd102830 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087903a2dddd9166f99e25782ef47de28f78099cd05aa894aaf3a5cdaeb6ab80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c237a602bafe7ed22052cae54e6a2a769eb766 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e6c0f98c7eecd1a28b93f7be6c1f394648a6a941146ba5ad08833e02dfeca8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27bd52ec634f8d82fa9fa2c4af0c0fa3313b137 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a561858ee241283521546fd054db47c70796e3869572cfe5fafdcd3187acab4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a633848511b018d7e58d0336fdb21bd5219efd9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c561f58d20d630bfc2073a0c57faacd1f798f3763e27c987346fd3ba5006bfd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b7f2f24dcc39c14e1adbd86a763aaff813f9af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d471d583c069fe6fb90a1b7a941d886cfa54dd954009cd121dea021b581c8d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13060bc673e7e5dc9113a4ab3bb937a408573014 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ec2d07c867138e79b3e0759a1e8d22bff7a597ddc72db744a46ce6caa92d75 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9cc1819832491087783108402d3f0333748a25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a0008a25a13af56e90e4afdb95d40f9b156c8fad9572135da533be584d614f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f87a034a3bc9ccf4594456b0ede5b7d42c3d40c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b230998c4e553656e6b15cb43f705dea2db8853cbf01d55848d38e5e1f0a8b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0666f0f3e8ae79b1c417ea7022feb6a864cec3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:534d0faec5c23c8d6c335bd6ff36886307f6eb84489989d34c3c88919a823bd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a19734c8c1bed3a19488a798c8371b45a7d84c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f62305900b40ccc034b899d4020810a3dfba8f80f42feb197977e5f336d8fe1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df51f2af8badf3decef0ea17e627e59a0e2a9cb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a182430dcc7956a5b8ad3b8c7bd600926d134bdc1716e959238a1596d5ecbfe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..43019b95f1ef07d1e92302f7568728e5f9e34c8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c518822069762b395346d2583f3355761c186b886932638f73d9e60d0c46d5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..870a969b550599fdf3e1fadaee58691d03b8f78c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8026d01eeab606e9e597196e7fa6137bb17d24a504bd3b328240bbfc9fdb9fcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a6344b8cb9f16c4056448d3a535e2a7e893456 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbe794d9b4dc933f0bd3660192c81817e3233646e79969f3545066e2a97029cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e71ffb83b5edadaeb2e6822a5eaf581a5884061c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383a58cd257c55a7db763fd4ce3fb4829a09bf59f1591926df8af576311c89dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a72abea7999369abcb0f9fa1a28604a9fe98ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a6ee3e79f59a3d649235f2601a6bac994e1ffc6b0a98d39398621bb5fc3308f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..898772c4ff57e1c0809f631e39e4a63e80f5e1b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:008fcccded98865c3098b10805c29ef53aca59ed474c706e7ee63cb1dfca775d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cf5c110dee4244698c46157351fb7a1e572b4ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30baf10014b3393f252995165b48e268c4592c0c151eded9319107f6829530d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cc7809995b50294b2def1d312f1f00f4688adff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b9e6251c5f983f689847e0498a98ef34bf826140a40a0f48e2dfce11e9e6cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9ec788f30f30933d0ea174667c7440cb12e108 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb78e3898a3e05ce042944014cab42e07f98e77f15756cafb0a7cf0f11cf9e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb0e6f95e213c70c86d0d3a7cafe75649f60b5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149f817938602543e0b276ea5d223c6dd03c9c33a56f3cf025a7a347cfd2da4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7b014d6fad250b32388f48abd23edfa4e846a33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28da557a41dc0e3006623010f505caba161cae612d3e5f0642e2bd8fb62c9f0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2f9afbccf52c00c0f137d309d9585b6109fea3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beee581a449cc71075909723065fe9d2972fe722566fa2a4bf18749c720e46c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9c0f2ac2f0d66433333c85e499c2c0bc4da157 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733428477ef3012e1459a4a08601b5897fc69c4c10ad7662b492b732a55d5855 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd3615d72416b2b077df1280f9fd30a7c23ec4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba5bd720eb7a975532943e37eca27a0c83133a7e00afaa1ba6a4d032f0d14b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d561a27e035136bd2b30afc6b161963bfd4fc8e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5dcf40628d7ae118f40635b68d727e5a8123630bdcb7fee65f1fc97f4cec8c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb74d1425081f5303737743328a07a1516744ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770cc5f52fea3ed36b81d14970dcb1820049709ec0ac4ed2f85b55c878ad9546 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c426c4d4af464b8d37c2d90186433c80c97f3e3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8b35d27c75e18e20e4f4a36071b59aafe0a892c5246c8c9e211eafb91f5f26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..821b238d85453d46b4e31f5823f4751493a92d74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dff32802dda0d748730e897f227e27d4fd8bccd6a838e12163b49e9420e10bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c162152ed17bf5a2fee2c9e1db230ac972b16baa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e739cdf95023c4b8a30973e690c033e8cf02a542bc7f4f79189978982577408b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..389a2a958e9a864ed1d5255047dece803d3f3dc5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4768a8371ae81a565d5fc02e193912348afb79227abeafd22a80ac6ae2013652 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d39255f265359faba975d4d77358b524b76c7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:760123e545fb611ac4abbd53893520b95f60b0bffbe3c01a9aa4b34e04b36030 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aac630ca8ce6aa1d7e487f6b270acd48415364c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb21b54dd37fdedb945f41e2398f965c4a24ac942def26a871157bca032080a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da782e8fb4f25b7f338048e02d2553dff37dbaad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d30ecd71567bb4c387483823e488b1184aeaba1fe0067650afabacbbe8cff3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d012e1adc9aa9b223c9420dd068fa37d940a8a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11e531b3a514806365ffa138c7f6d4458ddc1a0c891d4f1ec48e01f03808f38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60296ff28fa931160a69b1185a1f641c70952b09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32fbc421896528a23b9ad65d3eaad9b4227da105a35887795be034056a97139 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec2358a4afb3b249275b5efdff219b8f68cbb26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c56877aad1d003af64df5790e4595b28e7d4a33e88df64fc3314ca985a8f4e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94061623b80b369a8f16879c17313a10d0df5e95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4929abbdd59960b5fe6307d3def6c56b120b08c3168d213d48922d4bc255cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b945683fb0f49632441cdb35822dd4e39650b4c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62dfb83c8e629ad804a41e06330e285673ddb6aa1d4cb505f79f26e765720818 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..558a4b4061464e916da860b4cd7e4cfae700afbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d753d417f3b955695bbbb769166eac28f07a9b765d4d805c828bf351286922a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a9e1ab1b2f61768f1f5c5461e768ed5d6ff3ef9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2cf71e1ad82cb44be4dc389cb0e301acbc924a51e455f8784595db6c7faf2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0956b137578afffe1d0609b146fc906c3ff7a24b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa8b701b9f8536517a9b83032b71bf806cb196f1884defb9f33fce670952f2c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e501101b7b6527913eb547625d1734c1e7e1b0b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515c33965ad244946c82667c798e2e1659ead493a738054bed26e72d9d588f13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c12d84fa5c57e13724f8db0081770909be90707 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ceb1140bc8977270282b32d2c03db9816dc9b1c4d389179c1df154cb07bf36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f797645af2f86e73fd78e54c03c4234e7cee9aa1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671807758ec0973d4ee4ddab50915ce888554415b0508594abe2ae15bd5079b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed8a9f80d601f333368df05403f60a21853f1975 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_8/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0bae2f4a508ccb0c37c656c8dfb297b5813afe1bb9d5478f62ec4c7289f1d53 +size 11395