diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdae01f6744b9dda1f2d53717d8f5012cdc8245f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8dc20a0c10ad07e42db91067a99c16a163aaf089f94e9c0f3858d7bb035130 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..851178b99a4b27ba2dc6ec70bf8972a1143fece2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a584fa5a48e02489e5e392d1813d8adf36f28e148cdf5afbdcc39abfaaa52a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e43854d6be96b963b866557bf90fb134adfe7f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0ef7a109ca580f16b100943dac8839028cf8333b5f56ee1fecb92160e6d1b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..041998fec7e8365c37829152f7acdeef10834726 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d23f2cfd40426b68bbee5058cd9a9a83c889d70f5990533c16d54e628364148 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02f75e5a84b4d9f68a7d032c3222243379879c0e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf48cc51e90faec52b1cc4c229924a3f29727e907e90f30512e6da330c5646a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9fd75c1bfb85399db7316099ae1ee1bcee1f8ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b72c8370032207aac40d62c0a508a80cfbb0ddd1edcc9c246f4adeccbeb5341 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee748216d25cd68c220a570a6a42bb4d5c34c60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08213392751565fbf83d8e63577e72625e435ceb37958557e5ca0ffc393d05c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..848d1876b107bd46434b978498cd2b8e22143dc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8415cac0de7eda0f34ac041244f8fbc3f4adb56565c8b3274ac06c9f9861883e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..157bce8df62fb508d71cc2f1f5ca3e6ff5f9e684 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbc87600397814f19e97cb67db26d9f644324b28f66bcfa5bf3ac4567e99c6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d37d9be1516cc1b1314fbbe301bd17773a234013 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f482d6ed076e7357ae7d2e80ead31aa7b1c78bd371611399df54e917e67b79e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b8c8c14b89a5f5d359ac346ffe269d5b8104c0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc97630a5e70c342d2de9efaa8bf18da092bdab6414e953f7788d8b93041e4ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15ef51f981f2c188092eab9ed88d57eaa8c4a73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771b673e1b4a4baad06e2e4de35ec6c721a966d4f7c502a62cc59297fa36bc64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d498520c272dd6225e6c59c4e635d4612473b4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eefaac7605292b87b812995f6eafe159618beb214975e512589ec7464e1f886 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2ff7395db8f08a8062b62f334acccdb76c19902 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551039478dd6a2b25207b9a815573473cdeca7acbc317a384f3a95f4ecce7b09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e82e22f5fdfd81f159b7b6f91031adcdafb8195 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981eb60313db1da6d470f05fc4eb24e394cc192c022a7c9166ee951e50b99f3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de2259da10bbfa0fe5caac6421e27c1787897e5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36393d4de4e3205129e80779c4c9ae869dffdc68585fda511b4d998b857ac10b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a11f01ce25d1aea86951d619294c73c828efb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea98bef389e97ebde1eb48d1609c6eaa1fa5c27a0cfd58de5799616761f110bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dcc08e5db7282a3eb1aebdbd11c94d5ff997a8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b990d0db465c7943664072cb788d92cf2125a4d17ede0bdbae41a9a30c7abf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f447cf402dcd104c52efa6a449d896fdc1c373d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2141b1e86d1fc3c08942aab863f454a39173540db97967e65b9a4572776112e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fbd8dd68b3b111048a0b08dd0391e5778a6d502 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8712cab96958b30688636ebba631acca7c5922562f5b7950794eceff3b302f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9761460c52d88c188cf713a2a408b399d51272f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823193c0a169a1a525310f59e80acf2ba2b33c99dc9cef48b935ea13834b6379 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6fc1bd70bc87364316b55660a7bb3f5a19ca2ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51264df1814a624e3652243a69123019badf52470276e93043428df6702ba032 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d594a17b54486eda943d99e92b7def9eb68393a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53448df6d444ee1031062a94d656bfb1714c0a9a168077b302d0ea83a05e1bfc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a3fdd2232ca95d3932e9d3acfffe94ff45b41a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27fd194e0e8da836016c472c5fb1b9c022df51c53ae5fcfc3e0ae203d3e6fa92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b4f904ac4728ae37ad5093826c93bffc67460b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f97ea3a80ee11c6747d735272bd1f1c0c5550b370dfb947291db02ebe70b84eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b6e083f77bdd392601e80212b5046a4c71c812 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8123bb0f49cd40f03cdcf3c97253bc85dfbd1d7283a1565dc84721153ed33947 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb54f32ad51275c1a3a366f53f688f944b4a5f1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14c0bc721a7a7688fb9615a6f20ac713f65bf879557773591624a9d07861ba7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9103575c4b0ff77e7bb92f3acba64c7be9636ecd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f9e94c1677b38387886aa90cea71cc5f93525939f0a246c2f97a322bc8961d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..604dcbdcf4fa6bb03e2fce5e3ebebd7c06411daa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede73915bca083499c6040c7fab360694950da7b3005bad86252b4f9429f669d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..716149fc37f01c9b41cd8b4dc71fa822d352f8de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebe7029e6de3d5cd6980102364376ed52f8fdd9e4c5c896c9f4b66c4e203606 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..412fb636da9028ec76d25ed66a6469325d130400 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91aa8990e50ed961fea5c015980a1999e2fadf414b4b6cf55407f31181b16b47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c62fd4dbfda74f48dd5d971223a639493f4a170f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea9907a0ff645d177d8a0b183f783e95fc3c98211501ae67adff3fc1f631a05 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4205b89006b8f33f37558ba04e096904855c58fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a6227c7d4ec0d4d1e4d724b77ec9b0ad7dedf52ed8a434d45d5c1d09174fd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..907ecb1681b8a3ac4b8e76596d9c1a15af82cb0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b657fe835adb8260d4911317be2167e7f969a9026abe152935bef311f9d1f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc034bc8291141ab54ee9487601082a4d8b5a2c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6024328fbb3b500e56c3c5c34e484461e79bd86e2af140c7ea59a7cfec84b2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffe7e0f1826b3b4606481be4791c32e9a3b836ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b83ba27950ed6ed7d48f23227acab26d1a49f170d7119d7bad8c273a04187d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8867b04cfd9bfd97257adf993a1747d5f61a155 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22340c4a6507eb578b77c7cddd060107e1cb0e3b573623801b3b3f54410967ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1da402e11390ac39fd63c6973896649649a93fcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487e9c3d24e13a968d899ccf09dbbc0753e5b0766d39865eb96ed91880585c99 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d9a0673ae4f96bb90b4687c35b9aa64915d7ffc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f0aa738d68932910f59c09793f0547a8a7ac54107a2dda621c7867504b80f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28289cb009d2dd72e6618a21d189c57355cc1eff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff9e0249f1b1ff1c4b2321575f3b4a390681fae7a0e07ff6d71c57821ad121e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1acd8ea8bbd97b4814ee06c1c98d60dcc2990c59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02120ef320730b6f576f59d40ab2c38ad1ae2b24bf9814ddb4f721082676f24f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97dc1297d3c406d26ab67ecea2c0b90bbd5f1a23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500d78483b0d1febefa2f07438ce0a1292cc6d3155a34c1f55260271c833616a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf74bea6378625af27d36b4eda4ffeee55fbfdf8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeee5b4fa45426c5bc0c09ccaf4e0f6f47bef936a9d19abe5e75f2ba4401f826 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b521b7da6302db1681c956fc64f708a0bfa480b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44487f75c105cd109de193cd509518895bea01445b2da530da531de3153d2ac +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a54387593eb8234d21e21a7b476a4fa931b69eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:959bd5cf0da4cf10466646171e5b7085095fe341df4e4366de765c79bbb7ccc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..001b384a17cabf452fb363f7536cdff6b0352f3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5293e49b80e89d9e2a8ab61a684f042c9b2270c0a608869e20d6a31a8b6a5476 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38753c4f506a472fd91b155932d574901f88d404 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57a486b50157b55fc07d4817d8012fad4a30517bfd959c4de99b9bc54f610954 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6522eb7fea72fcaaac781f4bcce73b687281c00a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267d1607531f28f4d3518b810e0c43cb699cbb315e961e8a1df162c8c87a714c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef71228363cc8fb8bb7c983d2d082ae0ae4d635 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a91ce67e1ea8ae82b047999317ce6a3d2cbe08e89e9decc94ff78f5bf9c9c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1491d4053c115087267a582a249b2aa670e28f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737936eb6662fa4ad7c4d314ab25d321fdbbf868a1e32435bbe340690b766348 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..405e93ab9ef61baf16feac2036124b77465d71d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6bdff5b4b4d76efa7cb2bda930079048016ad01325e66c80a54467a28e4eddd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7f94b526356badc8ca9d153cc069a20ef78906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c4018f1659060a3107df4844470c02c7841b2f59df8ab11946fb45db118a5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a66815c6e23181e9d1b3a3e1fea4f97c0638ca15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05b741e267d60e7225eb94353d7506a20f101db741310013aabb7b894b746420 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b504f55e34ac1fdbeb9ab99e6001b2cbd8abdf5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c139ab41e1db09c635d07b14d64c4b24870a1e0525aa97b97f1a9a0ee80e7fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c15ac7635f00086ce2c2e90267be59c73782b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca3682912778f8cb6afdbf511f3f7407756e1c2422ecd5aa4270fea0f14e302 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cbfe3b63b989a38a3476baebacf892f6de9a66f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e49b3983039abe506fa5ff23a0f40dbc045ae6ae95718ca5357b00ee4b51000 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b68c1257bb4dd9c11b673605102ee2a8e12a0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c7f4f4a7efa834790364b893adbba996202348b48b0ef8a2e338f73c2c41d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc60d81bafb4fb8307b8ceca8ca721ca6afd303e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bd4a2c39b801dd179995a1bbbc64cc91a48a60bcebf86cc9fcadc63fd72b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58ffecc1b65c574b2fbb923d57fe6468f04cfac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8663793a121227194ab3f35e2f74ce6083373b486847773fef334b50f5e1beee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..918efe724b270b5b168b2d89ca80174c8b880cc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:064b77440d6a5d0c170c9762eee55596dd62e4328cc674153a0994945a94fa95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe22bcc521d17f8579d14213e0f0145cceef45c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7da583e28e2ee13ba193acd8914a8f7a9f9faf298117402d3fbd535a05f2e8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45bd40874dbc47921f07db2e7ec8e294a590db0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1746131863384876eddfb2f5e4e1d0ea5fd086805e696682f17ea4760a093c6c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b2a75fc48869e39f703f6b10ba7038b4cc9441 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7267f9d0a6d9d6c4899b9743c6f2101492c8c6f0092a4e5a79a0baeb02e443a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e79504b5c128c4b476ed70dc1e98c85e2e3c1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a711df12bd611d1ffe5a0e9c16680ec3c1962da23b8c5754163c00a0e3e406a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ede333ddddad03507b4dda6de15728de7534cbf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d57798e80718cfad068a5fa99b0ee4fe1a6d95179fc3a2eb819d10d616558b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e93f4333fa40cb952cbb0ba69465a51130ce213b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:636ae06f75c7e008205985fe4b1e5ca676a71284e62de6925ebee6c8e4a60377 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75d0c114fd975c01b40e0c1c8505b7b7cdacdd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e335e11386e56c449ff45904132272d82f7b8552be7e5c8db8449c07b52ea176 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9249f75b5b9dccf839886174c706a8248743833c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bc2b534c8a4279dd20e4c1714881a126cfa26a9584dbdcd19bb43c3f08d31ea +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26966a02224f7a677eff3515b3dbf057a502a852 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46e3d520a8b364cfef4da8541e5ecfa715cec8fe9cb852c9a68119564a0eb4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b1bdc6d38fab964e74a135fdc308106f7e6b467 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9807b4024bae133208027fe20ebd2aa85a5e11429c1c564c85efe0d0db43a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d542f82818cf810aea21b3066e788058888d3f90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c1192a1c3527a3729be157bf50e014e40a174776e337c0ab6700ec540aa64d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0061d8970aa8b285e0d3d435e384ae25771327c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21742398b15ceb30f95ac7ba62bdc32d3abf5303f750c8f382e431da4f3be973 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4fdfafa2acb05cf9b1696eb164b40f3b0f5f85d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce46aebb2b7f6ea4d721544475a94da492b1fbd223707928b6dc95112cfaf3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9857c524a929a12fc708614c0ac392748dd8026e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fefd6b354f646a95449a44d4bfbbfab0946e8969e80427583c17e1228eeead69 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..466e6c8a6095eefa44c85cd60b5cd09d2e25c55a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5810dc8b79b2c288b11d357d11c580345bd97d9f7c07f78b7f43d41db70139 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f650f6b595ce495820d626a4b2dbb4d49a76e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4974eea2c819bb6a9fd345844a8549359e440fb65738fb25c02034273d50aa02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db61abc06c8d0e04f3d32f434111c8bffdc02faa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f557611fe5a1e7ff445d3a83e57b3fd4699e146ef2e01995ee28887c8375190 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fbb16e2db00c15c9382ce085b57e19d21b45190 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07bc315ca91653ee464ff76622467117689f5b13d826e371d8b9c0c680da4592 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44217403d6787f3c3600a1a7fcc60058bc36d1fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aff16da5009833f9a20332ce51977e5158daf5e14d8dab716e6791c080a33ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..085400e4f14d066c8ff5b4e108e69b979e661fed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef7af6e4ce672f9435a5487d43e015c5038df79e35655a02e4f665bfaac2369 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eefa03fd686cf6be4560fd02e5ba794b9a244779 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b2b4907b808e9e47a15b5b52985e0a24beb0d0cc65a998309345be8c2ec007 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f007b4ed250db417b53d9c39e671a102682d937 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2bf4f83e6e349bde6d542231792eab616e82078bee64c380b09a07934183677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5731da1acae96c1f989595508890c72b2a1df1a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eaf2400f77a161b69864fde6a76503e0737d3a9ba6f3b48bf7b91569a6ceb8e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47a2de8d4655e2b588d4923855badb68452dc5d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dda904e6eeefa83fb262b562bc5fd34344d6427925d5bd952261e6e6df2929b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efc0665b9f1e09f19c35bbd2e1888a7ba6359e5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2228133650a5ed5701fee7bf914a55eb979d21df2e4fd2fa94c5e32d6edb69 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..206984ff6913026332b6d18194aca611dcd0514d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126f8952edcb3d674ab34459930d7adf731b4449af32167c1fc660148853c1e2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5018ff1d401ed0683e2a97513848aa5a97b4f3e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9070f71658509bc13c69c8a5283c3e1a342e40d912812565df93edc3918fc39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f41515d6f794727b736857e8daf4aa50cd08e35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ba8c9e68817faa56d31fcc0d97e569a4a9a6ba89e8c344d8877a9fb96c6cb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecf70aee688ea02687663a9013b8fb9dda182f80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c979eaf60e0ab31ff2611d8445f475930e29536cd6827840b7a946b8b506d6f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a8cd112619558c0e2f38b060a4f4220c14d256 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27a5e7c0d3b6c9727c0a71feacfceb01839cb652817c8561faccba79c9dba11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69918a0de73d59cd80d7e9e5a4fb621e97607af9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0705aa7ac78d9f2281e5115deeb27782ae830f00162fc9a5bf1b6378946df46a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68be87d3b77736e1c8829b765be234959acefaa8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d9ee852d12e74eef267b0639a2729b13c614abd74d3742cb22cccec6b405c6a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401c8c2f1331b9bcb36c5363ba7669a82d611401 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dcfccb57ed602211f4115d3795d7206972fccbf28a984bb0aa8f7122d5b8847 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..641476eeae569dfe08270d3a888e7b16b02c2097 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2ea1dedb84d9278e092f13c5032148c38083583de3177b9deeb9d8dac38f37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0efdd44d79719930bb469f9366e103fc8c6ebbe5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73411206e8f64125226999309110bde019f74e5da8b3b03706a1ada89d5396ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94c879ac706a5aa38b45237ededcf8f245cf2318 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:926778acec3a9177ebe934ccbbb4964d7aa91e469b40c3825ba42a5d9836052e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..459183b4f94cdef2b31dda208ea3a736f7e547ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019be142dcef06276f9bc3d16636e98aa5c7fa5637be3ea8a79943f6c9569215 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5748c1d429a91db1f032b27f8803fff5e305deec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aec52e31208902bb9e39228e44506b035a019181349a86db88f8bd466d63b2c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9fb02d3f827f5a08f68dd7f7a82cd23b71dc0ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d93fa164e860fef3de34e8e758c4067f53100d88998cfd7ea18c77532a789abd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54da43e417dd9c38320653f8e6e3fce4c0303e9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef81b22064e05b5578698fc6c04177e1d71bf6c00823ae5bba754ecd71b1e805 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e90b27b0f4aa9c2b630b49df6f7ced985eab521a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729c79930d3c420ab8c5de10b49f4305ea872d2da3da9eedf3ed990c8da868d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed886cd34b981d71a1b6eb9518db99096e95b27a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70df62a66c32193d250c0fe46391cb758e1d12cc60f840a97018c60ecfa59f9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85762a74787ea6d21bfc9aa2358adbdff46e9447 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34679eeefe743f82c60d6d1869eec213e0fe5b36db2bf82a69f1285ec9e7f0e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7352f6ee9b3e0b80b5d7fab459e63b4d479ad87b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0be94ff8f87c1d10be138d71702e934781caa3e091bd6cbda2d3c848413f81 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f87d3aa1a6a9f2b81fbee841a767f9d39df852d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51d3508275cddcffe09aabe38f5b7012db3d49e11a2acfc10a632678ae1b010 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1a8a87f41c137a261cddfd7f04cbf3a42fe9e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c17d5c4d098cab4b29510f49d972c960c2ee45fd9163a88e50145eccd46832 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cfa2375824e75416992fd00bed653a6cd725f9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda5e071e31479ed02ed2ddc025abbbd2c271e5aa488209e94b789478207badc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d63070e4c84d9353e68a6ef6e2f75533d50f4df0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e76870ab21332d12578f30cc0f8ccd532f30c50f0826cc634c3f79728966ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7543dddae3f6bfede76dcd98032aa4ff6b7f3585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85aeca4c4e416a2f6911380349476801268cad1d1f264442940b559d148273b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd1dcdea78701468b121ad871b81e652942c2f5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ce5ce98cfebf250673ba1f18d30bb78b74900e4072f45f07e6fb35e67ef5cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68c002bd2b8e8cf47af131375c9117a7b2837e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e1f30286b97da0b9ce384d32fb7c16adcbe4652dcf5bb06f86fd65827f3e97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a52ee4e4b72136f9d163227e7785b0a9c09184 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddbb59ded8d9334ac85a69bd10f7baa6b1e6e36e64fa1eb776a3e3565866310 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f8939d9e643279bad168d5d23e341205ac707ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd46be7be7436f57e8f862829f1bda6a5ccb052f8d7cb719e5913e239f851083 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dead7a3303652fd56eecd88594e146c7ff9168f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd66a8ed770c718b0f8a80f02c48c07b02cc196108612f3ae22481e34306361 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3607e39fa6e53631f2312fada8765891bebc94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af9388b641968fc574ad770974e9140abf908d296268994b88064401e980d18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..517cd6955f9182d075b402fcc9fb1df01f7fe9d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc26371b48bf3a8bd6f1326e58b13a651a6c19c537306c6c3e2d0c0ec4765be +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6b3ea9297c0e233acd84549220d5d57e74e17cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e6b6fa279064dfe015f069bc902c0e6274bdaec1076c3eff8e6c3af632ebee2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..067fe3cfed1b3bb171fae1d777c1bf30be85cef6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0d88ef73be17ed950bc77173755cfe999f47c910737ec4eeed28c8577c891d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a20213ef34ef3fd8d084aa4dda73cd6a5ab4042 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1f93bcafdd27164fa826dc7af6ef86374e4542474b1ade68f6b4a83cd59012 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c74b902423c92be5cdd47e7e178e4339c9d4d64a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894e46f6096e2aef919f7ee0b232face6f6ccfc24b08fe893f1db7bd1fe4f639 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dcbe83e256e514b137457af168a9cd953656c3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493c78890b8cf3480f9a8ca0d7e6648bddf24697264b94434236b7e74927853b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e114e2b224e351c33139b6e50ef3cec657da02f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5339f59e3a50c20c978bcaf252988eb49f790c168e989ef4d70bf5595153dd52 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b6239e6660634407a1e8e1adec07a4e4b8c331 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420b308d1c68803c3606e9cbe3eb03d131d95884ae8f377204917844e50ece23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c224df01e569858c189507fed5db2b93808ff2ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9dd688b9054b2e2e8514aa369e9409f96f69bd1000a21a534197145afb3502f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e71706456d9a43e24a523e0a2e8250cddbe9d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9991b63fee26322b4f80230e0ea5382d73f0d35dc389ec92abd9aeb9300ed399 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1b84a7265588c4a5dea9037e8916870ce53bf84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526dbbeafffcb81a54b8d67aa8eee446707fc50d49553e5f1dd307326b3e33f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0165b085c9539468bc5ed6e7f381371058479a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2514463fb1293e3d4953259dfd6fa5c73a5cdac4759e759abe5099f8048684f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a233738f3c2627ac1796dec01d1f98a992850a78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e36112e1848b66289a141462e6f96648b6ffeafeb63e6399ce7ed3dd69ddef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b50e0145717508db2dff1b726330e07ed0e634 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b7128b55eeeee642f8fedec6af08f513b8ae41b40445847aa812cf1e285212 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a9872f9f46bcbfe7618804ea52960604ae8f2fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13de5066729417f99ba7eb81e0e27c6d7ba35fd71e18f7eb3f3e99d12f9380be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9673ea920c2f62d0ba8c1f9171e3556503cbc7ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108c7733b779334ebae84f32e3e4955027ec81f776804ec8d696c6a02436476e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..286531c079c24603756eb4f9d89d7ae516f225d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55478c16db95b8847f17d0671eff202b785f780944ebbd5413c56c0c476ee8c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecc4a9d7fd9da9dd9da9d9175b0c4a17b94dd80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53153bbb2bd266d7817e30c8f17f9e8cea15f506ea6aaa55e537b6258ed27e2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27581fdd4961e7a2002c1b5e2022fa63f1afa00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed935b3440bbd8b74f65d552c1bedc7e5578fc40cfdf56f600461495f442f9e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da41a4e2a24a5c1664ea2940ed9c7ca5ba8a8b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e604d5f99d0d507c104382339c38537dea172b9986c2119d5ce58dcf92b7c76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0575a5cd7ce7bf8d3f84b820ed9e630973383e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba735a86841c68d03912f650d3a979f905a4a9674d853ece4179aee815fa9da7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c8118d9deab0d5fa0a791116c6b49ca6d0c7e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a474f8c20324c6e6502887988a55f971c54b923b24af71097e46f8fba981aa2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dbb98f76bccbf8ba32c2c3a7e19b1587548962 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6d38dae2f3a6ab6d7acb176121a7215434dab09cdf8c4be63bbbf641c4afcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdea177b872cda9d28562434749d358c017f9848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c97d54d880c5dc62994834bec272872be101f39c3f87be1e6248fcad6cd4d33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47e6af0a325f06d9fa11f4c1f1352be6070ffa3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a34bdfad9f93c6e4036e2ea8ec6707dcc460b5e8a7d547434aac16d47a8779 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d9662a88f898b3f5675e1acd02548ca833b001 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623ca7444f6dd41e43145c33560984f05c62f13ede66d192a7c85e0345efa47d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab73fafa3423200bac49178fdb2e937f8e8e0f8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8366f6bd879b731e73bee1ed69297c43157bc96c18d45b8b8300af9bd92e4404 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e80d2596fc433453da9d78f92c4bfa8d5d0f80b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e8fa9442f6b6fc84d311479720415cc3f80ffb14a11dc6fa297dcd3e7a3d83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce793d90a2fadd676d9c6d835c79c26c44f4fa7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db87d5b5a33bc961c72867ebbbbf6b344fc140606743be19d1389ac8ff1e33d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..529ff393c7bac85b9ffaea027211d62aa0e58aae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ef4a9f180c902456b11518dac2899ff94aa26e7ea7ca1ca4e2d1fb2019ce893 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e0b26d6e1dd1217a6d508660315d5a494241805 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa0e2bb6839a4fc904afc63ff73dcfae0e698f2f854a7be17039d15d84a5f0c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58fb7696fc8f822560f9a0aad87bc2be63a7da9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4babf5e24e2098c3bd33f4742ffca0a6c9904ba67ae2088fca937c7c7a68986 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f8d7be1e33379a1565c4ddcdfd4773ef451ecc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844af054237f8470f0482119c5064a34cc533286c84ca2b79e603ada42cb7b49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c6d2a389b82a8730aed72cfcfbe7a8840dc330 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2047df07eca40859b1a3f69ca0ce5b41c750a3bc50549415a61906bc470b2c9e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1c5de09fc5647c2fd57325401d0d5ffa5519240 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c05e05b9fc8170d5c7ab2426d593300c257c65ba999ba02ea3cf814f35497d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6553cc1ffc753e2b07bb40fb74e7e511bc891de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:288d88f5f52d1d9d8227e19e3ea6d00422bd259dbe6115ab7bee07af5cd4e377 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77b8c9f9d855ad29e33264167f39f79b0fc9ac70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7c71f5b9c2e57a525f78955792ee90ab212121bd8606b89443b515f6051a3f5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcbb32a8cc935ef315161d2da2b18045123f455d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a5c2442720cecb0f978881aaa22a6e684087188f02b5bd318abbccb96728f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..133edf6cceb408b389a4ee8f04874dafbd528e30 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b21413330a35f322009a61eb68e3bb9e05f0f46d9ef43fdfa78ccdd9fe5c88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f428a0daa9f0dc08d12e2a70edf5bd34eb5b4ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5863cb008d0ff3d311c3a643f7cc1e856d66a486874b8b2bd9f10a44f25e357a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c59a0f3e9858f235c39cf06fe0ee80cbb12d4b4c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d86937467d0f027e70167c93748f1ef293bc1a80404502fecf9db952e9cd4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e8d102cb327b6a9811d8478d71e8f0a192287a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79a22bdd3ae2c2b19d8e4e52710f83c927e5f0bd3896e1972cefc413e76e5188 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9988155158e73fea957b1803d0aa0ac299913092 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e00c63d572eae8bd09d338fe9afe6ebd69c51e4c2efa7953a1d996b47b75ef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c56ffbfa127c3a7fc40d8f3b964059016d9cb7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab18996bb2cda70429828d26a0a60fa8d8d1cbc89d2b69fad58b83afd6d1388 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44cc65e43e08e41f52e522d3e3a765f5aa6e7a5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4487941a32ad0508fd08458c0947d748c15cbb47f8a43fc12072e2ea5ea6aec2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c35f500b67c027a598b4fec9eff043f45ee612 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5219e1f2e0b0585e6a2f2a6f3fac8aa2d26370713542569d32af153b6b4ccbf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed822035ec2fedc45f854986d9a2f0e8168263de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eaa7b612794f571cff9648f007871eda29babedeb05a95ca1832294a197e84f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ccd9d19043ec886922a3627f21913c2f1361df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517602ee5b697191c72678f919707286da21587af6447fdabe2f1ba293167f51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7045cdefa2eb08302f05973f02233f221b5f238e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b011c317446d90d91c3d5d14f93e372a3be9d06fade9097297b5c1c6bf1f64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5967b958dec4fa2392dce9ff0bab7d9fc65df1a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d460db203ee12939955a00d6fcd32463140b1dc1da9901865357703a0e6800b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..325a53d86bda8df2bcfe5d2a17f254c9ca820fcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd864260183b9970d219f7b393b401b533ea3b71f3ed592ad706ac3197750fa5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d6815646ee914c20f33d8ca2a2e5b0f93da9902 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe6d83c04176a5dfd34077b8ddfdda78b04f3391287b09d3f7a8b708904f81f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71203f003f6372c60e2a1e329ecc51e057f11669 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e389dd979e98914dae7fe66b06a97e4c591f0c16fb96735bf2ae0ef193c75e03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4489d6dc2beb8a7ef716bafbe294fbee6c67685c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f215b85b91e447598b1dcb41e764b3bda91bbc0ecd3dd7f22100fa93d8fd73e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da952eff7ba71a48e1b7cc898a1401c36b0521c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fba27049f9850182af2c4c4d18d9386afe287a73cf7b554eeb2eabe0e4d405 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2f49c6888a1001f1509f425024f2200a51be1bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b1cde2143eb0f0aa77ee3f807eb48d2770a7162dcbd3eed3f7418dc7a44fa2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc433f9bebbe5dcfcdaf2b8979d1f3d7e751736a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e64d86a2ea8295e252cd800c0c8019a4f6b7c0cfab812fb58170b6b36e81cf1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d961b60bbfa89c66a2f8f3be4a87f20a6285e753 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1562d7d1805b638ccf49503192406ed37bdabdd16535c81a3a65ab871058d01a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d860a81fbff773f085d6ebac734a5c5acbe9e40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7d37111c8babf788fe85a2f8afb7a3dabb192dc3166645eae3b24fca310dce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef9784ef0ade945cc3c8df9d0288beee1e056c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f39693f4d4558d9436af4224107ad453e90980cd146ff2d1a7173508983218 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e308d8648ddcc644103e063df2d9bb9baeec2d97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40ff4187cc861cf2980509a66aae95160670196bde8237259fc59e2f59c06ae +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6137c0425875476ed68a1a3a0f6bf798e6abd405 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1012283a3c6c8fa7211dc3ad9b1cd56acb7a05f1b81150dc6208c16f54bded79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88095d71900cc7cb949aa7ca65b9df903a9cbc8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98acd5d6d6c6ac4c111040a7cd6347f56fbe03c30e08aa26621aa90439b97ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..852725b2d65c6e8206b321aa060636e75431b986 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a8ae0c6d2fef1ec5eaa773544f77215667b89520be7bd3876c1994278ed483 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd4e96c8c09802063237b140faa8b0d2780760b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7602b351345e58dbc8a3a3b51d45e957adb5db676ae9cf91cd4bb91401bb17b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..382171d175134ea82fb7bb4007f1554151b57182 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416d568df22df1d370f063d53786af93a7bd8c62448cb664f5a803ada7c781fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af42bf59c8b07f00af41859c6a4d625a47ba494b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a77e871872beb346fbfefadb1bb1c69480ad1caa44635db5f79531baef203974 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..304c455c84755f07a9c15100e915b47aa2dca381 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c34a6fbaf16e2771fcb3a5317e46623eed732ee9bfe9d5f13e1eb761781e20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..349d94d6f863b7f8b16f5f03f73525ecb7d810ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc45f926cc82115893eba40742462132c58fa3e905ca6bd44a8f04edbecafc1f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9131a61896381102cd822932558d03b169edeeec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b183eba173f601480cad7c740748a1ab1c0af8e67c1e39d714fac346ee734afb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a73319eca61e167ed0408c49b772eff5fc25a07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0acd04c0bcbe423e8e43c2d929ea095f2eafb1b7519f419d4b3eeb932bda07e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e19e06d4a9ff3f1c3895d0b09f462cc88f93a75b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d134eb8c93a2532c22395c59f56f5d8c1c3c65aa512756cf9c7f87f8b5ca0ebd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0ad6518881e21bc061e7b8db99e4396a2c3a35c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb9e0c462ece0b7a6631e38e27f21902e95d1941b060d6164cec3ecefdda5a1e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..694f931fcf86945bc94ff1638bd8280413f7fb85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:262f48311180d0809217c84c1f5670d555d22d2a40fe2bff1840c010407d2c61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75063ceaadc9e6b5d98c5d3afcff85ef18092ee7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fad53065cb3dbc142ac3ac78f9dccc32d6dad5b8ec80110914bdd8c4b5091aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66b3890bb79b2b9216bc3195e8b253093ec9d161 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605e6c24ea7cc235ec8829ad9801c944810deff56fe9bcf701b6148224a27ab1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..123faa95b42a383477ddf3452209e7b91fc1fc02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd7641957bcb02fb4875ab77fca39f8116ef389fe3cbb182d179812f18cc2e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a205a4b2458feccff170586deea171772badfc9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3395c82d13c4e327b0ab17493bb2f5e30cc61f4497531b0ec993f70293b07d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce6bc8607fbe6966d9cd5bfd593009afd79e2f74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d9112ea5ea208e6d8327099d3a00506b577ced5a669069dfcb3b3b1fb0cc447 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0346b476d681db88dfa6b266fe6b623a1c7d281 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbfa0c017da832e4414b02a9a01d40eb6d90137f607e8cb0c3ba03a2f2d3142 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c04c81ce7a230b6617f89dd61bd03458afb76568 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e8707e79850177204304426f6c0debdb045e9f818df5f17adda8c29923f40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b52d8f4896dc72046221e72b8f08792f40f13c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4793845379696aa7b3d4913e9677aec881600adb91cefd1ed37fdf5ebb5fc8f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5eabf2fa891d135feb8321b8cb00603611a3dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8264fe11db1871c3221e846ead322520df9d03cc99fe8c8becbbcd36a7174ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b8709f4f8933f1a44b2540353a41fcf4ad041b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5539353ad5efa4926d554452c825de98a9203f86065f91f8e826ff7129b89d38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a734d5fe452e60282cb54dc7722f40d66db4c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb5cb4b952ed46dd1d3d0dadb7ae1ab5d4615e60377b7bebf8540ede4f72358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e87c77bc921bc9dbdc94da3f28ecb251d380fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d532280843b2bcae3b5f5082de8f187aac07e2b3766782de5b02ef4e9af8b8a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6543f67ed87daa179e6ab07257fe538c8c0d0e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889eab879f9ba0570b5953a0d240f8f960391b329767c5b3f553594e52967798 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45e7ff85a3d832341e2ffbbf556f03ba5d8cfa5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eee7d590ed1d7aa55eaa241d7045b5bef791b720b74ee3efad3b0e07730bd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f754891b8081d39ca63c37c25dc98ddec808381e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1302fd980185836c746147e1bafcc2296cad16a7a4a058a05e76f5916a31342 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78b7ca80bffb4685704e18bb3010faff83a4230c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418c5b885f988e6ba6d5286d4dad9c3d6f98accdb538ba68e188452fec7314c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d498520c272dd6225e6c59c4e635d4612473b4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eefaac7605292b87b812995f6eafe159618beb214975e512589ec7464e1f886 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce5fae7aa5f1e3036856680d05a438bcec630f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8382091f53f26e6622b2de4f809b755b5968115dc0cf5044dac43288236bb03 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f3a0a9c394906b0152666fd79d8dbff1b86b7d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162975ed634a48d0f766823a87de72a2fc5448d5809d3318a1edae4852706ab2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44fd042d6233f52478a1ecbdf0b9698b3424a01e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c80141fe972c4f9b679390f7e9585651d452212665d6ce27238d192478f3233 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce3c4c50a73ffec3fec40c8af1d79b767d6f8b74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033207a1e6f64aea31eb1929c895b4ba3708d60f825e2061fb86670f4bd116e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3795c27a03defd544d41b29308d634534ae4b2d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a194c472d92742f426ed31a5b281a1c364bad1f3a89d26f1664bb573148d4a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c94d4b5145728fe0fec0b7e6ad549a7437b483f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e320ed9e2ce4376e2b936163998de5bf7601b0c5d2ca6a11395ccec90eb495ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78570550478f9294e2075fbbe60a793c193abfb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2bbe96dd73a2d11b42470dfa0461dfb57bdcb3cb248adbf270be81ada41761 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c18bc9ad3af8ca44ba23605da93932c8c9ce72c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f8b864bf96d51af22a9e1ceac666f08afd081bc85b073e10635114c7f4c861 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..114775193bf3f0c9ea25ab5ea7e8ffa57066059f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb48bc41d2272e3106fc073dff816d4f3d91a391754cc23fe0a5fd322579d718 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..026e5d1ac192516dcd5116ad0a83d1d3e800c31b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c443bce18f0d97f8314c3dc0cff39ad19747aabd4bf2e02f47d94e56086b4faa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ed7a79bc380b47cceaf7a75118958a5a3425ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81b770541a0f536a10465bae43369dc17a7540f401dac95382d2ddd47dda2ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6befdd8c1a8e2f45606e4533040428d2cd0a5992 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f041cc03158daf0b1fb16f26e0ab03ce9af6e1596cdf13543ecf6ca5a10cb626 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..532e93d84705d2622dbc586698e316f4d7f7d2b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61eaea105a71f9b63e56d172050c72f6162fbc5fe09047888743ddf3e1aff90 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94a1d18fa10e289d92439ef12368d2a394826bae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35d7750e19c969bf8ded6c8899cc10cd7e33bcfcd02f8418d77dfee31cd7f30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9103575c4b0ff77e7bb92f3acba64c7be9636ecd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f9e94c1677b38387886aa90cea71cc5f93525939f0a246c2f97a322bc8961d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8d6c40a29335f8919493c8d81579a8acb8df02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f94c06165cece8fbc85764a717534c0bca05ee9dc83f4cee21acb1c7c98fb820 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d1e256db532ad42c57f0d54618e61cf0bcb9b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80c19f10aa651d86c0a07506852d489c62c6226b46c858e554e2075a7ec4e5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84fd4675aeeb0d90243cffe7a62b7f05b93fb47b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30634acf3b83c3c4e7309e595292d9c6e05ef42e14c5a55d595ae8d8cdad6bc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af1693b88c04b4dc321ef130b045939733baad91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1fa9bcaf747bb6431971b68364982990751a28cd8f6ea2a3574c6972156a761 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec27d74a79031cfbae0f452918f1d0292f3f933 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e7c444fe1aecbd6481a946141ca828739b6d8c7c6f397e35b9c294781edeb7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b52dcce263d86eba921ef577155a38b0432f5a1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7652826b44ced62dc9466470b6cf1b3e90d26c363ae50ebd0ba4f52847b11bf6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d1e02c0466c570e9042b8e967c372d5afa6b3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e9054d8365bc2883080d5afd595073340e97acde02ea621c47f7ec4b819aca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7759da44da1ab8ac43971d624588ddbf56f77b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941203aaacb66354d437dad9567851034def364125ce3f984617df85e474d117 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cea80a3957bb20564d1934a58499a3f0000b83a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5bd74779600b0edc560605a7e51d874e86831933add07c4e126412eb8af965 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d781d62bb646902acb55e4161b4cfe533398e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5495258cc385b2058c4bdfc9771eba6f97d950347bb6d4d7881caa15d4bf03ba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74648cf33d70b2067351346863c4072dc411a2ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74da1c0b6fc04f15f0c25552bd381e287143e5bfec1dd255282c4628c206272 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28289cb009d2dd72e6618a21d189c57355cc1eff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff9e0249f1b1ff1c4b2321575f3b4a390681fae7a0e07ff6d71c57821ad121e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86aa0f4077648d53aaaea9bc13d91683adfc06db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586b427741b961801ec9f5bc5ce06dad624b03243df0d457741456b84f3b21cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b86d50207185178479fbfd72485bd56142400d51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96dc9978f2eceb6a2f78adc60f4c9cee2f836c33c28d231bae91804bcf4b4b52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f543edc49d529e47ef29e2334d0230a95ea0e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea42d0f112ac8ea1c8977ecd11e7489bd86d74272f7cb0f549189b4659178959 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf141de6adcb1486cff2f12b4c1d2c1fe752c8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd95be8d58680e6a068575936f61f97a0fad7ac9a393674c9e03e3ec34a6bc35 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79bb8e0a5e3b95c9b5ccad4074d2bbebc6ac321 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102a8a0e6d9d9c5ec16e4583131005622d618ce3d50e08048302baa8d2ad4bd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..001b384a17cabf452fb363f7536cdff6b0352f3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5293e49b80e89d9e2a8ab61a684f042c9b2270c0a608869e20d6a31a8b6a5476 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6721a58b942d65567ef0c415e710eb64f504922f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90765a95a8d5a8bf16f3b331b240a07d83c19853ed19d35a4871cb4a5cf0f03a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d25199b254e3179e1000c282e760836b1c626f32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a469543f0becb6321c727e289084d0ea38d09dab08709d236267ff44c3656a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ab551d7b32213e5673f59769189710013263fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a6c8b7a29692ab722d1f12d45d185ae3dc41d69decc0844de6bf5dd8ef7ddb4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..267353bce2c8e2b90b21970bf4c71e75af1df419 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157b932381de92a4547c54f81a4fd9db0eb142c5ae55f49c47e4e4e940b764fd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64cecc1eba0eee6bf66153785375f88d73a4de52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0faa37c2e0aa6e387032af8bf2947fde32faa7bd7e2a11284e11f5a22ae2e53e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7f94b526356badc8ca9d153cc069a20ef78906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c4018f1659060a3107df4844470c02c7841b2f59df8ab11946fb45db118a5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc340064fa842fb7f028157d4b35a4277fd413b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bece179336a1b397989344d279307a997b02d9fb840b4bd0cdf910f046f43fc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ffd3da7c7ae72c710dff94463fdb4f40cdba079 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c916959fd43c714121e73be96156b52ecb442f7a518eae079b76e465fcef585f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c15ac7635f00086ce2c2e90267be59c73782b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca3682912778f8cb6afdbf511f3f7407756e1c2422ecd5aa4270fea0f14e302 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b541a1cbc741c0ee863213ab3b32f3bda9820c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7573704e9a135de02deb5500e3ff7f11b5a0617cb89eaae4569631b11857741 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2656303e966a6eabd29082a4c13013850de83282 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e858d7e4e25e5145425ec28160f8535d6e74faeea01f7c567a4d925a59d6661b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc60d81bafb4fb8307b8ceca8ca721ca6afd303e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bd4a2c39b801dd179995a1bbbc64cc91a48a60bcebf86cc9fcadc63fd72b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fee05878d92e161ce53244e9dd8a05ef8844afd9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7f596333dc33a7febdfb891345fcdacd998dd0678e785404bb8db9e18d061b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b82a8920097b9c949a16e6906b0f1436117d44c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3edbb61cce16bfc97bae6cae84acd83497dc404fc226c537f5eb0e2f582584 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e89c696562e830e153b43b504e309e8a74cfa7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7342d2c8ef621519d28f395bf95b2b11bf1a0c64677de7831b18cca8e6f762e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..721abb6f843d42c12bc6ee6c75a4e66efea7f078 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef0753b8535a5f152327519bf489b639e3b7374474f7e89ab97ba01e9e35fd7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1068002eddf9a3ab3872da11351aaad7dc674063 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d08ea296b27d8ecd7669eeb7ceb045470ed304b2b645e7d3e1f1576c9704a95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e79504b5c128c4b476ed70dc1e98c85e2e3c1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a711df12bd611d1ffe5a0e9c16680ec3c1962da23b8c5754163c00a0e3e406a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8911a0324f7b2f020cad94de5ddcec7578950385 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57dd3bec669bbc35f0d55675e852758b65682b02a4c3214a005e692e2292d6cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38141bf82f5268e49441e869757483ca0d67b5f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:032601c18689d834dd02822663868676bae902cda80240c92adb08d983a47325 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9f8bba25c927abdcca12ded22fe422f032d49b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdea57cad19ff1909145bd722454849875b4fd90f5081dc1a2a18e58e0422dca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c29f10c42f506ab97efee92457ffbbcde117cf57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e65a0085253e14fea40986fa4576390cd9f5c0de281bab34c3bf7216b474ca24 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..315140c7ff083b6a82df0faaffafbeaf2f911124 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec53eed13fcf7ed73336a58f90092db7ee469ad24aff27c3d60e6874083c04e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..342c5b154243179f02810c762c0617a7b7d72f33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b287864f98548f2920036efa197a5bfb6647e66614bb85250b0f9799ac90bcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acfa998a1c1371a2ae808feb9a9602217e540a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9fdc96e5600e09840a364822bf32491c71713856436d1b50c88b29ebef5de18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6782f4a954e4b03358fc9dd5174c6435e58ed4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a52ac40cb82f118e674efb9e7b9dd71170f6bcb5042f44141635d224a227db1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f5e5859e8ea942e5bbcf37d15d75ea0bc890ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7e86460cc3045d151b1c9dcdbe9a0c5ca486438076ed702b54ec9e1b2d0abc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2c426e64fc4115d161aeb61611076461c61f8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32f88c34f0a8fe55037a31a3acbb4ce0a66b4b66ce1090b2689b24f036b85ad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff0bddbdd61062e1bd2d9c452fa97ce7b0d711c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8708ae7662394252a04e278a4f8d5bead3f42a88c4cd726731d74573ab5bf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4566b1d360b0b0aa3ef5516a47b4b8d1eda21c84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da58e8a94b7802d397ca7dea1b731a9ff80114e239028d14373f240149bb2ae6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..783dbec9469f856472cf4d4e8ee14827cfd50daf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6573ebc0249b8794dd6eca5dc25874a08696a707b52767d42bdbcef31ceaec99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af1457e2b8180dadaeceb113fd46a35687e27ae1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd97a6431a2e3cb5a93fcc7dde24cb779be2bbc7eba8f5433f0efa8a14e7799 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44217403d6787f3c3600a1a7fcc60058bc36d1fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aff16da5009833f9a20332ce51977e5158daf5e14d8dab716e6791c080a33ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7cb9d3512230b21c42592a2828a94c1b60c791 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c55d64d55bd1b784afb68b94f958e766a4831c8c39183ba96b406450fb578bb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faabf5897482d0855356d4958f5c9cfeb2661eb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925408f1fb1c573406cee4d101781611edbe242a4131cab85a8bf8f4aecaa448 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f007b4ed250db417b53d9c39e671a102682d937 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2bf4f83e6e349bde6d542231792eab616e82078bee64c380b09a07934183677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a13affff11e4ae8fcf643b516cc895db97c0a49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff2fbb2e82803b02a7bbecf29a3ee69724b57ae6f3248a253ab077ab1fda45f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab88a96af22c4654c812ca4bf4c8f3365051d75f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161b859e8742e3cc6fc8f24c84d9a1acd82769dbdd9c365939cd3669526eeac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71b4b2bdc13bfb79c8ca2939828017d95edfe1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773ef99c9532130ac80c2fb7cc07ca89174b9c7cb3653b8e6bead38169616551 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4e7362dc35d0c225bbd465b37d0ed6bb69ede89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ada552f003d05c4307167dd609684e8c0490691441beebddcea334c6ff8f20 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0412ee61c57c92c927c7e66f3368c2cd67e71f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb28b09f262ec15e3a2f0ffcd90687b258cb4aad9310e63ce78282a73de4c38e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f41515d6f794727b736857e8daf4aa50cd08e35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ba8c9e68817faa56d31fcc0d97e569a4a9a6ba89e8c344d8877a9fb96c6cb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e59262937278e4c12d05fbfb58fd4b734947a90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a42a4812a359f85e336f715a1c8bf534fb34f0378cd67b187587fef45cfe26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d98086b62d7634523532b0f4e52994e83bfa6ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7ac5b31d9414957e88fa4d9ccbc9ece48585f9b5d71d27b781a1bd09db8ca0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f066213d0e0ecc9da0d8da6eb9b0b46a84ca603 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d509863cbab63dfc6db9271797f16fbda000600dfd3d3b4f53efb57807430325 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69d27ad085726d09fe79bc0d46110034a271933 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270a303958af7b319d467f11e45d5108870878bc39e16912002e6f5db373486d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..493eae1ce0cc7e7e88b93074c4039a1467df9a3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b634b244ee73559de07655c6f83ad0f5813617809ba2d7f3eda020beea0fcc7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0411675e66171818d788b39c72a1069ce3d462eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcdd1d78bf7c17c05605ee6c581aa046256c48fbcf9ad89362c294f0fa11e16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdd2a0a0ce62262c1b8495e6c4f1e8071e6f161b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b7933d7f1f9ca4cf0717077981cfdbb4d9220fcc56312d9b67a9ed5a6032e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabce21bbcb4de077e9542ea8c1a2c288c71419c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b506fae57aaf5a2dc5b0b3c58a99ac64be9bfb12a3c3ab664878be7ad8e6df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..459183b4f94cdef2b31dda208ea3a736f7e547ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019be142dcef06276f9bc3d16636e98aa5c7fa5637be3ea8a79943f6c9569215 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2af7aa5bc5a49a0a406dfaa3e6399fb3f002be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd919eadcba5741a1017b3ff1909d2fcc224bdcfd297262c6fde426c75a031bf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f0f5433811e7be3f6301224acf5d4e91e819bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10608b8f598d2b0ffaab33474292618b7fdf8f75df69aa119a32f408c0a72472 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8b2724c9328af923c1e0aee814c4eca6120e50 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11c48847755cb148e939c26d8dc13548c95c3b9478f3d1e3f8602f11d75940a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b481e3b554c38ecde54bd3d2ac62cb1558ad0817 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df206e94368a1a6fcf1dd2b86334e925ec6843d8cfaf54954b3846fee41e51e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02cf481e9ee17f382e341b7cc27e5dd67ba4fdac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc0ef74f92c98e596da3d589df2411dfc758c2b4927fc32e5497ae2abd73c53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14eeb12930c4339c5e17b3fd45f012517b80b002 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b2a79bddc465c1133e03db1ccee6cf61a613861cad99d9377fad53556633ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff1b51244e26a117a1ccdd8a77c6527d78d31122 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241e1e09c937c21cf161d6c37f5d44b010c390376046a51ea18edba21f23f087 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52dab7c108af32afd7d86f3ad7b48ccc7517c423 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fa3caeac5d213bf27155090e870e98f2eb890080289702f01f1508f83f3f9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2576ddbfbce4aa7790a7ba6ffb39fd8a6bcf56a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09403a9c24e6a93f176175fcbe2050553ff3b72214b1796e05d25c889bcec044 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea05d685259e3c47c636d7c8d8f5f6ded6c63b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318fa0d6d74a3283a725cdfb27207b0b576abefb708b1e8fbb8e9db066bfee82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89f6a0704a6fff783c4bbdf86d5965977d70ffbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e42c4c52f6c30fa6cd1ceaa26e23fd1f09dde8c5098e96acf60695e0ef6cd33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7543dddae3f6bfede76dcd98032aa4ff6b7f3585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85aeca4c4e416a2f6911380349476801268cad1d1f264442940b559d148273b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4823b01f32e3691d04565126969d6ee5e91305a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbdc24a81616bd875bb9123a4da910b3083f258c3a514239793dd34a6074551 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ec6b8d7eed382c03051a2f4eaa6e07849547e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c387268685e01ec0c088ab9cf2ca12a1a24872a2624073a58dd8b7a47d20c56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b9be83944f3d894ad0fda7dbadbaa5ce409b895 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0122a2724b2324d9f15422289cd40c47f361db288245baf8a0eeb13d34095ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58ed1f9d0575107165f7d6a169a004bdc3f2e4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b91cf46b75498883293e02c900db4fd63777d215b5a477ddd9b166cd3e52fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..856769f49153d5e943ca7cb8f68da80312cef373 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9778cf02a674d41b15419c6e9240a337f43f6d8a044678a2a13ce4eeeb5a1443 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3607e39fa6e53631f2312fada8765891bebc94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af9388b641968fc574ad770974e9140abf908d296268994b88064401e980d18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42298b48ed682cfb3f05adb5341c2826e996d14a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3569d66209ddee94a840725f6cda74cd7ce30ab6ad25fcb8a453098f48dfcdd4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36390a80568cc61712808e65dc8f6a865ffbf911 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6065f3b1f040955f33f46d439d0b08e5875dd48b3579e4e2cecd4c0f892e70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcdd7ac065529ac038299d738759cebefb050af4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf21442d70267e9aaf848da752b305a28e4d56f3db9cb79ad36a78acf3435469 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..772db247b815c8fd9f4dc5efa7cfb747534f1cfb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10782ec3ffd52fa2fdc013dc55d3a504ff73050b021711eafa4c4c1ea557092d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae12260ec10f2c2f844a5b99eb26b0e6ff1c7d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da2e5ed43b0c2b99bc42564686c7f2f2d910a01ad51311866092a4ba9418687 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47bd1d1f237c917816a4cfa7ec052db04f1b8408 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ccfa746704d6f6c92762f0429c88588b6effd3f3652777c3bd8f33a6845bbac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1bcbb9a326197111b5cee55de4dc778433f3e5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11cc2305900e082f3b4d2b5f1e5de8464c35afc1eb820d9621951a3d1edb13a2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61025c3ee3356d9822f5b73a2e39d6263e06af99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:542e0759263b0208fa5c941d60e8fd659a8a7a00bcd4f5a56954691692af2144 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ac1fbdac8dd2935a64a5b18d7b52cdb384d71b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743cce1ada7db34cdce27224aabff7cdfaafc6cb6187aa358344b4d70a94f185 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a4d6b203615776bf4b2c7c16d548ba3192085b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386d42b041f16a1a6ea4f715e0386ab90541ed16127ccef1267623dcb45d361c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0d4eaa843323ea418175a446cc0cac8846570d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100cc43041af36347b0977fa029d03096137c6b7d6ed9cfdcbe979ac9fdd27f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0165b085c9539468bc5ed6e7f381371058479a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2514463fb1293e3d4953259dfd6fa5c73a5cdac4759e759abe5099f8048684f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d90008473e8ec2e4fb0002fc7d5ea13597b624b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7bc6db9912330eff5755fdc2f5236e4542def5e97745fac2e56d361f1c284c5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62cbea784943f5d27e2b63ca7e8acececce77711 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d336b0d294bb7868e287f0b7cea3ed02a6a1bbcc073a7ca30a89326bca8e77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83aededd6d6995174351980d168b878b66c3badc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511dbadaa52c26476783e63d568a7b619c681894ee75973bfe7ea70223fa15f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a17aa6c8246d242e8082bc83ea51b5d8d99d2e47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0179de873a050e3323364e016084dfe75733ca4a7d9ec88cb587d0d6e8d524a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7717263b7515ab756ca788f83be410cb51f1d005 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01b47ba89edae90ec43ccaf8b944386c97b3da52207f7cd25d4e16de21d4096 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecc4a9d7fd9da9dd9da9d9175b0c4a17b94dd80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53153bbb2bd266d7817e30c8f17f9e8cea15f506ea6aaa55e537b6258ed27e2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd794b448c7098dd31282d148d916c1451dbc7e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e561c07e22faac83a6a12414d6d792b1a2b4b3239ce8605caa07fe54d2a609 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad9d7bff0bbf89d4c2cf5531958ec96c4c83c31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6962db74d495d0a53d5e32e90e9ada4da7df276920e693f8753dbca2f9a33613 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73cbdc4920a4e601dddcdcbd2a76c23194e268b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043886292abf17fcd49f9041b7dd8f74a109c963bf6d1547cff150f75fc7b927 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ab26378a6037f018a54f64080d8c3c8673e82c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5d4d1c8edb65847e77ec979a41a9ea857513556c551405e3148ac63609d80eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db92d64f9832808babe464127d740e7cdc5cf55f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbb8cc327ad96ee76861050156e457cfdea855cec9f4a67e9ab852177ac7195 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdea177b872cda9d28562434749d358c017f9848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c97d54d880c5dc62994834bec272872be101f39c3f87be1e6248fcad6cd4d33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..395b1b334ec2facf380e71ac2c2fae627b53c524 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa5f04806cb2ad57f18b4cf803365b97a22ec94df2061597c859022b91e0bfc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e683bb44b25aa746d978b1571507d8c9638b398 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8c5af607d9dc28f1b63a38dac020becb9be4dc4a3a5bf98ab6e67c3a810119 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9138643dd06bc44e9d8e69e2c557a58b6e916843 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419c6254741277e53957e5b510d94116f445b074334cb1a3b186e6572d8c4a00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6f0310bfb2279c389af35355e0c742c628a20c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ae323d07e551301428b129ace1ae90cd100f937a7ea5002bf033d2cbcb2e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06e3db0ec3250c386eaa44e37c474ca628a322b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca9f0a343b59974d69e7b96eaf9b8060d7f392ac44653fac0d86f8ab3d39b22 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af189b2c300e900a20883c489eec36f4c0c9dba8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd41dbbc530190134123c2ca0b2060bd8d1a5eed36df13d2f788eeecc828a571 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f997e4257ce056151a93f80af8e3177026e648 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e3b66d1d630071bffa3b78185f6b01e6e4e4fba827b6f595109ca9325c8285 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead419583169f6018f4c5a6377f5162326c8c7c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f8046721ff4a8df12d41bdab18ba17d6a49016d921f8c9076865bcdf8e2119 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca8a5082829367fa2a648284b60f55d57a3dd63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910871759d34d70041ead492a64ab6a161e6b3c3ba3116829cccb9aff666ab39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13769e3e04c12c31a3bc98799aece12bf4b954c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407c65b642c8ce0605488b5920c3c0cbc755827310439cf7e101112d85a24ef8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9238b516822827bb6c31c9f627eaf06262f50907 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8c5dc051b0e853d10a0b7feea81a410f2f50fdc1b97ff3ed1942376dba63cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6553cc1ffc753e2b07bb40fb74e7e511bc891de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:288d88f5f52d1d9d8227e19e3ea6d00422bd259dbe6115ab7bee07af5cd4e377 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63db3cbe2acd8d466f0370ac0e972c70848ab72a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87e350a83e3f5d57ae42c0fd3516fc8595996ea0e20615e79576d6f2f5127e8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7881312ff5f7a0b41cf8209fc444682ebc640fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa41d601316fcaf466333c1cab451b520a76714ce7900f01f7642b5eb1f3e9dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e51a07a12df4db7015957504cd9805f49bcf549 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6167b2b92cdd8dadd518685a7bd5e3a1ab25821524157be331eb4e22181b72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc8cc46a31ca6ab0f2e2328d3ef04ee72d15f71c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24de5557e472a348b4ab6a57294a95dc852fc8d1333433ff0974f016b7e97a80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5af31730bf8f761ea636ac67720417b392958372 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60f3e89b2bae09b31e45cbdcc5a0279c423207748a07ecde0416d7340fb37fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..374db473011fad2cfef71c16636d1009c75033c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b22e18bb3054b82458273937031a7823cc5df26ea03c0b29979b63c2004970 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce958bb80b5438809948edb0106a0da0564b7f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985a946950d11be5dc311bb7b03c42d66a74f503c0eda16c26e40ff4bfbcc058 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3e9a071a29463156a8d14953aded6cb906538d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16e49a920c9ad8ac2a2aea0aeaa0f791d36549a14d056eb1c2c37d4c147279d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7424ec4397b31358a7b1a7e5fdb2036572cd31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6accb086d23f96eb07f84df334caa4febebbdb320949b39dd26c43baf6ea1632 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f71f799a47f115c08f799153f47fc3e7a82a884 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:567861126afd26c0cf12458f369277bbc119e219b197da0cfe26f7cdabfb1cdb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..107a4c14de3639d2e25bca7ce19a344f7726e620 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0238066fdf56c12b9cd2527bc6a00860baab9459f4690b6053a99b48417ebf77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f01c15313de7395d3b3b3189e72b7abac5e0228 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150cedc0ce4a36b87068ed419beda9885b302aa9b22015d61b6042c0ccbb4f1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2809d9d0c997a718a6fece64aa61a794ae07b43d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fef483511827add4890af5b90ed8acbccdfd1832b7eb101597cb17c838ae68c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65847e387e58403e8e528b6f236ad1c97f2065e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ecf03fdeea16b9f2f2597e123cb2cf5559cd7cdc418ebbb7e7ff9106288b92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef3862a51daa7bc4c276ed80d08b7af31e15b4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6578a02ae04e682ff207983bb36f6aba02d48355d2d183eb48fbfcf4b1fecab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0538d42d9e51467f4e7b2b61183c5a8cae9ff70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ba4bb67f9d901542d4a33a98be4142a536be94bc8faeb102dfd3a2e5237d1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..332071fe04fad4363a0843d01865027625eaf11c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b85945e100fe99bc2c875e38218c840a2a423cf81d78e0cc84948a0dab4722 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6b52f0a82c578d2a830f990ddf73c373bb3d0e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bf9c14f3a8e3e3efd9d1f128bdd33d1a37db4250fbcc9f181931eb49e1aa05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5960c7d35328d555fbed0862d178bb65c0175d88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0098798265fc567cbd71ae10cbf82de5e100fb2932955ad3e7b13e9bbc990d0a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb809369d5ebbd06a4cccba230b7e8293eba28e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086d69d8d7f8f028265e2722b798f1d5a88883eeac5062ffff3f40f774dd716b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15dc5597f40aaa8f9be981b00f29d39a5edadf8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6609adb5e4b2681f18cc59714516a25126919ba8ac36a44c279051f8839f5d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff7cb3a5d08ada8c29b9548244728dbd9ae6d2c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c4131dbc4bafa0341c9227867962a41e22196426f9d9a908ca441effaec7e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2976bbe00cc45456e81d79f1915fc323846c57a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49500f99cb66a70b4bd3cf34e4aa0e3573f42f496e11b09aa1363f49f80f283e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c87fcad712cca1e88f46a9861964655054eef16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522ecf9402ecd4675e4d443fb55793a1bce5f6be242708257185c397f52867d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a88c790c6d79cb376e8de123eb1023a1b3c727c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af7bc55abfd5b004dd59d43a6e9e05a2b9ed7ed36ed80de65f8ff3fb8d0fffb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f259e0dfe30d15e1865d7a171632ec0940974e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad048a97e4ef784b4c593fbe297323d6114deaa44710059df06581a8bd4ab154 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f0a4652c92b0075eab9d5675f85930438bc210 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e176a355429a31b27171dea676f51d4f9ff71b08b4220e9e639152e91c1870 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c96bdbefa6cea74ba2d5a57718575133e68ba7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193a93a17da9690e909f8804d08c871bdc43415883482675e199518f0806a836 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ee9439589759250a023544aa3f2d7250f4fa8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c775b429560ada5aa41c17950f67870e6e0ba6e5a789eb6604f5f2386525e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e1acae8494da3b489739dd6b6bf6c4af7c9d0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f4ac7014733fe639b4a3a1b8886d9b3202c7827e958ddab655d6ed2866694a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c0a637e932a3d2bab9dbd6a3aa856d03c440f84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4b28c36034f9734dfc333ee925f7856edb315d755a20c73b733783374cea09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83e46675be2e8e5ed19adfa1e8eb437ef2187f7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf258c8ef79fcc3c1e9dddde347829a91f95d25bc52187e84cf94065e64c148 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abb57fadc8566fbf60553e6415d76561ae38f338 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbafcd06135a85046cdf1c9f44a89f4b5429feb094b1b1d6486e86387f960f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e8efd4df342ed25a292e95315891f79c2c18f57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b95c92d136dfcd97271aadfb0cafc7a4d175bf1c3858eada019b6b4cdf2bf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eee48bf76549b24116db03fe4358d3bb4446406 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6edad33f84f59537d0744a5091045fd45dd35ef76bf31f73e7f1024974204588 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49e81b576ae392bacf68ab1e4ad797eebce29612 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9428f2e7fb84092b08c47b041c351c97e58f81405b198c2d63a7629e6576db7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e5a18270b154fa4390a85f999ff883649d326f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ceec2424aa427a8dffd1709352b3a878740f64a7eedf535fb48e1532053348e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08e511347c8b902e9c8ddc3e9192d596fc8105c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276788d9fae244a744905cbdb41b0db0072187a3dcf41b89a4cbaa68c9f17b46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cec597f225edcfbca51c46369f565acfaa5a6d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ad2bfa8377ac7c850bd306d12197dd6ac203f25ffcae2a9727a0890982e717 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b548a5d8040c2ea2105d3c7f1a9734c275f0e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d653214c9843a8b9be63eac63cf33979d903b671689fbeb37d9475d9b0c725d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d9cd15c0cf88485b89a97967e4285126f18da09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb0d0b44c23a15a1096f7b9540572d50c7ada01f6040c81d9459bab35689dd4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f117d97e1091fd813449b9521f265165394bd4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_4/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb532e98d14720b3af200d51a264ac083a120a155c399ca3efab28385773af72 +size 11395