diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6424eadb4121b6d6193696c50297690abcd020de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0613c5da1d73e707f7537ab833432f9bf4d0e331d2790ad56ecf3f90f066c949 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e378bd58b8cbd317e8917d8af6efc02c22dc47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22dd0637f1f26f4b1c1e5389ebd5b8c4e34408dad0dfc969f434246224551fd4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6627be51795c916de2721b89d4a15fe002c6bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4725a842b07e1bbe736228771eb92e875fc923b353823c5124ff03c72a8019 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..260efdbb23bb353a152e0895ec085cc6e0557ce2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e667894e9bfa6d2f2e897642ae68bacd0516430957415bd15db1dfbbe89792a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec10cde625edd7add7883688f85472b08a442673 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb98f9165c78d24316cbb5d13b0bea986191ea71e376120f78998b8e0dcc3fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fddb67345b5fd3653dc64938b018042a459cd61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c9b64a4f02e091ac587173b8a1af4490cf86353289ac92332445128f9b8154 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b773d52cfd0cf1fa98c0c87d3ac68d1e9c005b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1a3db66c95603806ab016e9d29a887ebbcdfa6de0686b9e577da36bb781cf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5421ba6f26ec5778bab20155257a1472194a4c3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543355d9f167b7058fed5164238738abf98555ad015c080d5ecae9dba058d092 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf4e8fbe0e56963d502cf0d44595df0d9f5ad06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0108a2a4d791b9a85d3a67cdf2f2294c3313a060c0b4f19363fea12bf39ba111 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05424b4e8d18c5e1903adf9eb06a523a4a710217 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05fc40c20b2af3943a43e3fa2444aa47414ab7fcec4ab1041a8b2bdd2239ed03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdf7790445605aa518b060a2f9420d330bd2f693 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa274a19a7f01649d2a33ed0f360608dfdba1a94b5d8e9a9003aada3787ad28 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e0c5ff1c4f5d1a379e0c666500b8bb3148e6668 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc49e9f79fa5a8c4e62f2f2614ba1f70ca681fd0860f3f4b3a7a53c431148ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..becc926b2eafa07183a642726eca82b90434d8c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad7ed56e9e635880f4cd2c48e2a912e7900a96148202ac7cb527578ee661676 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac85a6c0a2ac93684b2d0c93c9cf0a7040ec20b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2744063fec7a3a901708bd27dac21faeaa38f9813a1f5442d21b6e9ab388dd5b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83d30fe04b5ade6b36efd16716df3d45aae91d57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72996c1e9cc61945d8a43da324812a67372cc6156188d872a232e8f6c88f447 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..969e7016988dd408c8655231796e5e0c9ed7a4ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac19c9cb0d4598a4e5430253890f612612120b2ffc37dcd8d16c792df8067893 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..970360f0dd6d81d1f6ffa3d53971ecb0fe8d3103 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e7f973937a125e51344541f5ac8ba4ae6e9fd73271a325bd652f7d11a6d3d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e8448d90d8fbf8317328a26030635fb253358d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f3325a089fe9f65f55a5811b4685f99cf4cd6482c493868075f6ace2b6ae2e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c43deb27941ba87e3bccac4ea0f463e2a040c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41d20566e8aeac8700f3ce81e0710bc76aa0b8771035969dc2c5ee1f3863ff9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc65b5d0bafe50c9bbff935fb012253c52be5b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde3a4385e3abd353afb8177f9e416501ef80b634c2c9299049d8ba3faf1e178 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea5c94b7ce6e1b1c591dea94935e35d27337dc25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1faba0083d93476ca31ee820e2422d7331bc8df8ea7fbbb18adc4769ea5545 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eed73a518c558732b2e9bbffdd5d321015d731e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a19488415b1256c66024a7ab923924cea3189b5b9218672ddc8e84404a8f00c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd12b3847490f1bf875496250033d1ff8123124 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6ad6b51f6437312d72ee1250430a2e6370d68eb94883659ea244744be8d4f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5d46183c6a914713a3c7ac65e1384baf57c3a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a303939dc50c64b8c4896502008bc6df8053f0446a96f494ae0a7935fecd639 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d1c480ed0554242c04c13820e5c578a731ed6fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94dae00e7f65e8f709a0b17e3d4c731fba924583bdd100f008fd3eb60bd11674 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d42e10df6a7c9d35bfecf61884de5b548277ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf9b1155f5088616fecaa96847f2796d2f162c4314c58ea4ea957d5aa6aff57b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bab02159341cfd173d109426371990f5d11e23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8642ae0618d97138851680c72bf025445ec5f18bac7e790183a04b66c028c87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e830109b95de105b5a8b942e8868794d5eb01c54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797e787b6a03a9f45778e46aea957aa1d7818a82e5337d6659d953f82ff3ab49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..effad300802ad7f8084004fa6157ffc18550eb48 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40015033efab24921f0fa3bef686b9b0c49e9e6cada85a9e48c7be3cab56fa07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82691bb71d71f85de6dcbbd910065c01c736e7a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96af2fcced4ba621def7b2cf63a9361f5392b8573372674afb500bd49a90f5bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f909c23c5d542ab96c88e2401350376ca64e55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e614966309b505bbe72b8a283c84e4e9eae3f1ac884cae55d34d512b67856c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..843ccf22fdb90bc0d25286c3aa8951abd7b255f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b03e1f1cabf9d44a774d00523a9630e88372be0f47c418a7893065626e68e45 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c56659af5bb6932ffcde9d9b44c4cd04aac67e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5843dc60b99fe07f829a09799256dedde65e6fe0b52c43ceae1740068ff6243a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb6b250a841e836ee910748114a5fa102d88873 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba36306ed9cb03f400ffc2c4d7473eb408eba79823eac86578d5f2e18ada018e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d475799c27b4d53ed1f61551b69c1169022b6db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522112dd952c42c219d25cb25ddd26e3a1761758f197bb4532bbc5be5a9c5331 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..440e1276a7830207de2a7969bafc79308b812730 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbf879e9042ca074e1a8ba3cc5a5d1756616c133e5ab59135b457d3936117ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..405ae3184af650650c5405abbfae4be746e9f48b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f285548d9c6dc24eca2a5ac2bef372eb52055906685c3268494fbd54e13b0507 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a59cbb5675ac75d237aef7d08a28fed121d5ae8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6878875c71ff5a84591e1386323e0556ff5c59a59e6cf85bd6f7e254bcff0756 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ed932ee5f5def3f50d068c2e9a2ce0f579732f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6a9b4bde1669169451ee2eaf86b7f32abb773e5a2b7a461f9f6c7f6fca3b11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f33289bd0ad5bb7bfebc033dcea430b9757a1e17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217dac1b20db280e25fe20099303da8aef9003d01e8a2e627a5e7333b7943aa1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a738827e80dbb17a77b598bef4433b13394574d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebe9b2d5423698f95e46c7d18d90bf2f8268828032ff737aa2f11b18e3c2d1b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a5e8072f1d4f7a1eac5ec9d70c79bbccf3210e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5359d0683e15e934b9e6d8caf88876f9eec373510381d389c7c230a6231278 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d2f1e293ef19922cbda710d57904474b0e862de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8fdffa6b60fa3408490632cb8f85866ce6fa047472020879b4bf7c42d39ae4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e367675c463d30460fa8c01b0453fbc6dd157b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c3b2f227e4da1867db81ccdd53a3f268b4b4a766189a344f2c820f160d29670 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e985ba600b72820dd05c6331be4fc7227dfd9138 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da8a6346a0f28896b4720432925b00f03d225227e0247d390f40ee5db7d13a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c24336ddec44144b585f9ee482f6acb84af8cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb01f536b3eddef5b2459183ae18a4de36d91bf39525fc20e055394bcbe4ca6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84f4ec7649f39c46a96d775b4ba90854d5c6c2b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a320a632e4e70690833abafcf055a1c67953106be4fa4b30e9b28f9cf7f34283 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa0e899c42aea8c870c9860230d11238b31079e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77ace907dd4ac1b36ea02bb068dc24c8e13d1f6d372e7b7cc4765c7ee2e5ddc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e1cb6d2451afdf4c79bb10a6d53d1767067c80a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc346e7dabed1d99240a0cfcd18c364b8da8a4101ac2c760555495573c18f6c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a795c6e82c60e4c4dae273f865f279578fd03d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2189338494a9bff0538b9128674574ab4b544bc5f0873f6d6a7efd11bf0e7b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f42059569c2a13a783822cedf0cf0be9faf36165 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04911e7702c0534947ea835e7d17da100a33701a3ae1f85c2ebc553af3d6441f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b7c7a139439d585d44f2525ba066faba7001b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6fe481569d73f6fe8fb903b564e2d3e79c35a2bcd4e3ee32420481c6074ebb9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a74f80d02fce5a8e02dde8d4577b12071b297e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b527b32d436e1b1a90f173f6d025f57cce8feb822854218803a1df675bd67b32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec34b0dfc7fa247e7eba007cdd237abfded9d043 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e7ae0a7b1f5346fac20988f7578811b14443edb7a6b9f5793ebd1d607bac51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97bce619fcd5e59af9fdbd382ec9ad73b4201ebc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a15d4c66f5e640ef23ef01bd862217e5221ff7242f2eaaf84086b219b7ff918 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8096a7c14df783a8daa900818d655cc9b5ec97c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0bd9b11a933f2e4dfec7849930d2ac697640ccbc2800ea7e40195e1c53a027 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..538125f2b5dc356b33dbf194623b2d994121334e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f72653d24d569af1bab745ec8f55312d80e24f64c46cc8b597bb320113eaa9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd559fef7f311f904e4c32eda327778f044f637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ddac61d9dccaac25d2c9a807ff43cf2a040686e6e47e8826865b1a37a1db31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b6738ad1af663ded19899b41eaedbfaecf19f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef90aa5585dda98d60d6c40b3009d44ef885f0e3d7eb9380a69689f596a9e18f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1b346c75a8d6f6d20c55e2c6c45b1ba23b94438 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d33250cb027286c8de3cb36f18b644613857af497d69586d30e3691bb4c680f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04d5b47685cdb33a2ade85f73d2b4ec6fc03e780 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04e55e4860f31e9318113e6dbada6730231be190a1f3266588580d085346b35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81303cdfcb40159f2bc777427c795992efbc4174 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5552d626fd6e71505e3691d93fda6ea2eb49d0a47fc523cceec36390b6306c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca7e065ad062c5548f7eb2f46e9861f62d7f6c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8119d1be8b3a4fd81e827bba4ff1abf4bca6f5c9634c1c31ec8e523eba4054 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..804ce95515f940d86a85ed2bebec56192b04bd88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38451b287f49685880371b54796dcea36606807da58595b8db6e9b58c7c16cd4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9834fd2eba6ad7c3e9535e0396ddac44bc8f08cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:900ea3f5d581d02e9ffea7d74af0989b46c35e3b243f01cd80b3d6e1d11c8c9c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8398fdf5af32d059f9a5cbd49e1541a11aaffea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470a31a985da6f7b15cc118c10aaa721ce5679041c267043312139611e5da03d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a05ffdbbcb3955e7544857d4f4d44035f597e32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd443301399eda8686e7e2e0dd4151eca586217a6bf4d0b58b81375163c5467b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e3a8486697035204cd871d301c3aaebe8f9ce2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fed5ca66861bb56ccaf60b66c81379aa6b5053ae5db4e3acd417d2631f0bee00 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e0178f5af71e817489b951d9a8914344ebf2bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fcf1546e4f20eefe87249f7ad42288c3531808b645a2d9bfade3bd49b29a96b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cdd66514b9ff6c9b0acec64a3ad53a9d97a6637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da30613c1f889039e08620886b42781fc4f88f713b7ad63562b64610845f6849 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8be61f4017aa447f03f84c7a7456167f2e42d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caefd907b97b7188587f723fc21ff8b621facc183467e177b42ad440404fc1c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1fba967f04842346b00106f8cc98bc44ece4ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c949e82415cff06bd21ea72bd41f2b4ef9b232f6c577d38f0852e4bdeeef9f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f46e48ffc3093f0457ee131d2b10692f41f584a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3649898888081062156b3633d7fecb883eb13a28517da9820da8ea3fd57688f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..441bbb9f97e1ba131b09d53b1fd9dce4ba86e91f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb0f94aedd9b9d6d392576a31c91880fe17b692c1ce4c9657c2304a9ec375d7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af898a45d70f2abd8261304228b824f97e23835 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa08354f5f6c46a118dd57272c41c2c0da9a1bcd90a2f1ca39c76746ecefd74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29406843a50c19efab282a56fd17626464383f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43aef010af5a26cbbc2eced8dca34f53efd3e66ec540f5d8a68fde30947b209 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bffe415787ef37eae2cd2422f10cb0f18aaddf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62a5e2be7ff58bf5c17b6ac1fa5c3e56c716abc2d4d0e75a4a29c8ce3a785b35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc0cc9322883ea9941eb810a8ce5d22807c06ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2540c8a1c3e0c5ab32a30ddcf61d496c215554ab66f84d4283005e4296ce0ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9687d505c0098fef6dd60a4f908e0f58c01643f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c943ed687585c779f30e61a6fe54183b3cff449ff40e4f636e73ec0fdc6bda48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5791008537ca7cce2463f624c4f4d3ac692b9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9733626eaf6ae2727cf88996aef7053e8cba27c4d17ad5de595e642cec0a7e5e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bdf47d432334e7db3fdf238f1d39c62a8e3ef64 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f456a48b396346c77e9712a2b6a3aa6ccf32bb077024df849426405635a0d9ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c16883356106d9a03ccbb7a1f10226bbdd32381d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ccc4a29e9b0071fd8fc90bc1623531d45c90f814f4092e1eafe65a7b16686e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03ff53fc834b9eddb8853edf84fe6011973dffa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e1aff530d12ed4502e1b77f4c408ef4d54ad945d50a00c009dad280945d34b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19e3c157b7a07f6725d003dc453cbe6be3d2f0c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63020c407f49f234de9bd9201f09ff6376860317c3df0652e7dcb76aadc7f8dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0eaac2ceab845c904519f7f2ceb6baefd407cdc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c9d5848c805a5e6e50bba969e52eee142d2340f7e1d8acab59faf9313daed9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..158309601befbaabb27078350115972bbc19e5e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb4dd667ec16596d2740cff57665b815fb5fd46848f3444236367e3c6569c56 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..869cdea4344dbcd2a20b38625cc96bcf990d1e25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fd08049b6e1fa31cf94b4d10417bfcdec69eeb372c375cb42c87ae8e7b598a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd06035b1f806790c2a33f89b492c85acd616fd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dad41ee8fc76a5b6c8d7fa88b6bc0ba509c2acb916d9372578670a3e839a03b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afcf369771ec0e0c3b29036dd1d323971e4400bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26d1557a321a99add075560d85e91c385bf6c85626de14c84c168fc72c5fbb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b153b14766088a8518ee1c968f58570e165b04ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2236ccb7a88a6e5ad7f9c7aefb136b9acc1ff43cb7b0d8819e88397310e02d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4944c7b917c27ab5336f26cbab7f9bf626b12e72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb7111860664fa4c936bac14c16f39b138768a3cc05f4d32098b15047e40a53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b5874fb75a4ff46a0a494d6eaea5795c550048 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcfc24d1c1151e62f4b6994d65c5758f78b150e4fa1c400ac68489959a1b4c3b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa725eeda3dbdd3aa69d8a869d339b9a1642d596 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53cf7e1f89003de731cbdb7005830904a2e6bb90616c226d25be17e09d29ac7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..547e1762f93537fa8cf6e9338c27c5989f687acf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd6357b610321bec6e5c3add7f10919b9f3feb67dbec3b82b47302a51409dcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5828f88dd3d0fa94081ee286f65740075dc11e5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:918ac47cd040ef723789e060588a55473d93e10773a06704f3f74e2edf5dbb46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa5da7e74b1d7ff92d81b07a200dcd94868b8da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4dc211482ba37f81dbe8e41003d14db27701a0b78d9913d7ef744afea9fa1e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16c188ab03598f9ae5885959add938f3655cd011 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c25c7648443d43a762e11462acad8eb3cb52944be18115dff5131936754d1b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5a3b5d3d89ce9291c860b53ab94f0a40a3cdc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e9abacb1bf692b9aefe87845e3c9a354180cd29cffb1ed014536c00ad913a0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..030b4708023c17728517528792192e11480cf53b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c165a2c8f1fd1f1ea93524954e5f4f5f77c1fe6228041af761cd46de12d77f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c859f9313a2375795c3259d81f86c5b44b929f36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cda64c8a86b22ed94e3c924dc976d23607377860a5c07b33fa30c39f28a327e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..807eb15f80249cfd0b71078675dcc80af8c7fca5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4928f66bbb0ffb8aa4e2eba10a78230e7b42ff8f192743af9aa3e60e9de2dec0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d1351237732133e55dc468ca9deb1ce7ca71e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590360f62fbd4ff5c8bcbe7693a29105ad2d20d379041783900735c6a2c701dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..023393a2f9980b8c070be751a3afaad9beaf12f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c21058c119c6c3ad7d5534b46cc5b7c6f0105ae5f82ef73ae4a87cc37b6a679 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c2cecb6cd960711cfde152dc0801e43e220bf6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298cb49eb4a6a0db1d15fabb27bb3f53bbfc7d286294dd8e991ed90021854c64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f908eb0f90411ab4be23aff6a60a46010f257ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29feb800c303dde8f4d2419b58561253a87f9910e9878decfdc285dff7668ea5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4839ded2a794eba9c0bc25cca6987b8ab0bd296f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d503a7e48afb633289269c2efd3e55833ed3e4996e0178662f97447e08bcbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29394234ca4bd8c28edbac9ab8f82554006c71af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f7ce2a59d46e734e0b45ac2d2194ea66cbb09cd2599376d7c2541f5825b7ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b2fff313e811a826494e9967c1957b45e6dd13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492ee70d0f93b2e0993b0e64c9fd2b949e7d6d2e5bbff7401f50130172a8f00e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad344a9f948833fd51256a821588b84fba8ed19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef7f3e51233269e9c9d4840d5857e5af2d2d8abba8d99ca16842f62dc15182ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfa5f766f8b33c02a1f298b9c9c7a38c8665870e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4461f77a0d3e4c5cbc21496aa1a5cc035b4cb5500c28b81f82acd7c95e8cbbc6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63e8f6d38f0236118e946f42bb9faf7f7e7cba34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0fde155b3251bd974a9d8e55756fd8c7f98b6691166335bbc543138095a44d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07cc221d632674467b55cc669b732c50c04e4e2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf8515cb291206710dc2f8782e17647707d590b5eb197ff3dd06e3a1df8ac3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c821275e085fb919f4cb011c7162256b570c2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdf281c35bdc0e77968a2b0cdfe7a9df39469115f22cfc5db5e3e6d72e8357e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5abe768bbe5209ba6ce540f10e915b1e030e41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e06238a58fc5ee0857b5398231d59a005aed7379157cd710b3e0eb8977c3f9bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0521daa13b7bc546e5cecc40efa08413939a06d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0754c96eb8eb94b806e34bf8a4d82caf042b5fcd699107cfae9073ac37e0c4a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5023929b9cf861608a98a38d62971f3c1ce809d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6feee3d1c18bfd2c8b46ef0a411d769761e422a1e799b56202102c278c188085 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd6335bca099d3a0a5f9865400c431963e789b3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf28c5a8ee6dc4ecdf66449ecc752f099d4a803a3b89007f67cb606587c04c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abef1dbc91f4427cb6d862ff621e74bf4b4958a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44f2169c54088740cb6e5901e0dce1c5b0048d5ff5993d6003b37f42855d58d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e667de565d071c95916ff66339c76526e5155c1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6efb08afa48bafdb437a466ba431cbd799494ca58e738c8dd325ec82c07b8a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb166dbe9105e170064c1b8ca895b780695b5086 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a6a94bfa03052e413248ba31fe4ec1a62d7ef23688bc83b77cd062972b5690 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c633234b1c75c519f4e65c5319ffffe92c9d349c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a08d4174cc0c8c02009b992658da347e476a697fc46522df3c34899be0681e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e41cf4958ab7e630d90e4f827e3d08ae35ef3fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e31eefb35cf7efabd6f69dc3e7874fbef6d3d3f96daba4d49e960083dc259a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13d95e9472879f0def4337bdc50b8b36074d25f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a266239a4f9b9ba414692cf0b3b72bd29375939c18622c6e7fe36f6c090609 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f67fde189e92a526464af9ad23b4308b5e5be46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cd595d8c1565627b66b2e35643375299c952b00a244f3db7269cb0a60055dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e132b3155699eedb32100cb0ed70b8681c0db398 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5535114285df5e9bc371a8022c2cff7696d4ad0b67bd20df68bd1b7559c5c3cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..815d02f9cd87a8ccb1bbbec92a46460c68390572 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:163edab838950109a5ba1758776eff069b7d3ffbaa58636530c223feb189844d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c512e5f6f3b1871272cf14294eb7b5f0834c04d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f675fce5c5e6fbc0ab292757b7298f5fb93a1b72c11184973a1ebb7dbf598af2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e17f7d056c8ef0042cc56d238b30990bc10e29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d68dd022779cbde0c716259af8a28276151ecd29d66611184bbb572eb27cdb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0d317b9a6604ad10ed30f46351cc88a4aaca03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459d497143bdd8459fc8eb186a3448590254f2f91c956e825bc4e8b5aa9a4ca4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5e649c8da848817118574bc9e94ad7f24881a19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81023ee2d56227c55b26e920f94904773a3de633938b8d46a6ba0531a0d917e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d5b48c578fcf8352641f52b914f6d04abb04bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb40e78807030820b5a3308d8cd374f0632a9f6b4d8bb060ba54ca08c42ed9e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc39852846b044c00482c509258e171ba49168f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa91ca3aaadfc177a9c0f52dfee93ad351240c4a47cec57a281559b2b76f951 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a22cf0d7dfec746e635d0981967e60900911ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781143149368f7fa8371fad18763df5a80e67d2a49955e49591a169a4078320f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe6edba3260ea8568abbf5084f9620279c145840 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e1128c07f519e08545dd29a2ddd222d8a1a6092783a5b8f3b84ff0d732254e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..037265be0fd4a831fa6404e97e3f553f87b2e954 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b39046e8bc412fadc6fe3ca8cf158d2308b155eba43f598c84d06d936b3e29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7d80560a46469892733988108e326d472a0666 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17591ad9c4c56c0c2e7224912ed954c800891703a3a4fbe894107978f0de6453 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3eaa40acfbdf2f0893e8857a05ff5fa6647d9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b548aec5a1638107f923c79b9c2d2874d455e922ca3a36f4f92ffb616b7b8048 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3528177c5106c89cdf641d36608e822ee2904c42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b63b1587fddd56c96e8633d34eb1437692f3bbe47d7548c0534ff1a0a7d0db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8166e207b873f83e52aa53723f5be185b3780f67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccfb1125071f2abe58630c06e95ac9735ef6d4e1e541bd31e527748a45676e95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fecdc8980cd4f233b41efdae5fc8b81e47c7dd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9d224ca3f2219da7ad997f0dee9ee5ddc96484aaebdd9ac714302161b224f5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21e69d60b973ea6cdba501e0f31850caafd960e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c69aa34aa225d62d37f23cc2ba2fe0382e86dbe347f08af818e5e914e15dbcc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32db21f39503071574aa0f8f314a7610d95c3f90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca41d54d1395d709e257468ee5206600f5727592736f7d73938b5f88df5bf80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50570e6ae559822bab2c77b14d9027bb2fd4894a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ff2fa533c585a94dad11582934fed29c98f689d4cc987c7dda0ef937635235 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edf31687c6987807b46136ac41f878adfa1db12e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa667c1c4be873fac528b7ad66ea1bf3934e424327b17a8c76f0546849846a58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a58cea2608d3a1e2353a636fb2ace4f34984a4fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf8027c09b15644e1da5056d9d76850dc135546e08652d21bd3babc9ca2ba54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f18d35158c534d752ee2e240bd527c2542a2008c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4744b9556725912fd2a9bac05e9e18368cd5e5184836c07f06d31381dbc84a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b04ce827abb02253aacaf74ef49c23251154df2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b584cefdfad0ce1b5fecb89e934f1801e89b2ccae60c1ce03224c3271418492 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b82fe60cd322989b8c7fb965a6f9e8d962b4d83a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7298912a4109076e4e4787febb06f812fa77a3458126770b6353e7ea71b565 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b97ad26d0b53acd25a7ff371499f4f06b9be31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c40012139c244bf05fb25b95cec5aabeaf4dfa6150f7623b5b16affe816b760 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d986036c843449f4f1dd839e4951c5f4b67a2b55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69df60621dc4992a2d08a79cfe1553ede131f24047d1728c4ba9aee51882cd63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50ec4245d1f8dc05312da9094a0dd964790b4496 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0a0ec4a25fe4ff5a0a3365348da519f058538c82e889490c983889dae98cdb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04f7de005f31f5a79577db2ece36c91acb4813a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a6c03c70400cf95f2cb000b0608d0a99c0f73a4ca3593560c0b1afeeb0d9e8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e7ec66deb43432622248a238bc37ece5bb3c9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d523b9fdcd4cfd29dee17068ed6590ddeb7d73b9937f0432ba3f36d4aaaf104 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d978a68d576bafd2f1be6e3491412a69d55d4080 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86dca3937a25756a22634f1c19140f56cd00102628b1d75356442234f5dfafd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7dc6bd818f05e6e06266eb119cfa16b079266e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa8f7fcbe19e52fcdd07098def3f2fba3c55d87fa66d6d2ec9ec99115923aaf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8875135db51df2eded31dfb023893e6c4ef663d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549f093f863c07ba7f12912d95d8dddc70d4a5986c865a177a9b48e1504a3935 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26ae038d1aef7bf6f86102528053b76cce65c8cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab29e37f2be515c636a4074f8a23dd3fb73dfe4427e6abbaff3b3898f4fdcef4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d511f3175812efe9aff539f270a3d11bb053a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9a45082adc8a47817543fadff62d14f7c42b95b9298a5b26abe9247e3edebf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5abbb786a4d4c8aa759a0a84a019d74648b2b71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff8b7e2b556c62e2595ea9c445440df25df8f4ebc53a58a5b1d8b851c1ad81e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41b38df8d3ab720b5635a1a01091fa4ce30395c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a841c8ec16952606ccc34449d4b2925c3da84e106da6dff0755b2c87a8dda1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..661e8b9fc0711e122dcc377cb125721f3a522c24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f7f36dad171eefdb4dc5d4de675e9c226a255f73686a6b7df278f83b8640d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78ba2ed8b81f3a36f26127845385c1e205e80265 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18100441c2fddb778792f0765e3213102200724fccc258b17040571dffc1961d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b12e3b7bb21d79a952798e534b2e48d2efd1bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1159e76fd536c3ceb28318d30c93203ca7a693a092a4ed02675fcf706c9a1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6cd1257299e4e5fd1cf05f3c4a2da598e96901d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1292e7eb41f5a3792d333187707e80e355576ade5cd6e074420e811a6313cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e913afc38d863dc5b2a1c438f0b867f896d58fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53830ccb74df1462ec3e8d8f5cb8662e0b69a35fefd926280cae4a07d4644a54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36164f506d1208d0c83a50f04310e0379d4df130 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b2b79e0a16de0a5df7c4d8e166a19ece6ae6f6741a2cbe9cbb205c3928b5f4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22c1f68a2f258d80df82e5605854612aee165cc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e556e598b1335a5e95acc797db607f74c1ba0dd738db48a959245bab012a399 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d6c9e3d6c53ec4962513278042c1110215f33d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4135f2b88ab7ac5add3e347fc0f78c581f76880991bddf3f5f493d0d1fc4da21 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c601645f904673ae817f725d031e1c26ffd6efb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c273547eee4a1c2e5cce53d206e042c9f4ce00b68067f1e65092d279123a056d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..307544699b361f29a28fe30fb0dddc5fdcbb62ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eddddfc44eafbb5482d070a999b0a5992ed9c42663ab63113cff6e3c82ec163 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d98545d8538e8554b20660881b493836409f331f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a0d98c874c169a36f08b33ada17535f1ccb6bed2ff2d788e74450963fadadc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5418d5309ba62b7ea79e16410479ad9dcb0565b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b79c31718f48ec08fec937685bbdf60eb6fd8b91d4de47fdf76eef4f699fe6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b918b4fa7785d916e819fa1e6bf908674bf9bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835a97e44f1b9beee3ef4e2439aa4df809e26c26b4d3d55eed0c14676680af89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..761df0d5813fa8de00507d90d042de029d95aea9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c613826401137672cec9a66536d7fbd83732de08ca10bdc4b845be37e6412fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fa1970d43a3f6a20cb96b4008ea3c5718badb69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fe269c8f538ea07f02a1cfa698def64b6fd87402bfa3d3301ffc456ceac3ccf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..595914d622656a8a0ef9867f99a17f931a192ef9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788638627440f9a2669b63b45dd76d449bb09698799454237e10dd6c173ce46f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..784e49d9b0fbd347b6b8cb19f71f755f39d40ab7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65105271ed31d6269cb2539b5523641d530857fed2fc29d6644980b562154d59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..343262778ed9ae4bd429aa284d2c2f4540f353de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f2acb835fb4606a03c519e56f872e7f1b4a49efa60b74cb7032eb8902b12e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afdd2393b3c49e5ae0539d4d56a514806e84d5f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d28df41c18d19678d7f4db10d0d469ff28fc7f5800948ca0a4af01930904520d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63dd285772bf1a2fc6d14273091cd59a7385298f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aabb3cc53a3d5a2ea93d50c9a1a2cbf9c0c53755194aa4a7e255de018a7dda11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c27cd763cff5c082bdbbfd46d18d83a35fc4f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b548df31bb0ae201451cdc08945f72f7bd0e6e96a4c5003419f2d37b4c7847e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cb648637c007418eb13a9ae9ff3204b9fe0fadd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ebf735e567da7bdf5384589c96fb33f817d1473ff5e0687125b4f84010095e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51d20f8cdc9440292d6d0534e416c00a1e147e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda680ef36514a47d77162ead11bb0186bebaa5affb6e151427b66340f559e8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81458e13f0c062d11ec2628980434723ac36bc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25326dc4ed60e0f1989f7f2270aab8e41d11d6976853821de1113eeb6a098203 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f92c2d42a0bbf7ca365bd8bae17da72aa33212 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e287a055bca06a5eb4847f678a4b52ff28bc7450d20f309907de72d7a1dade9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3653267e21216093e1149bbf5580fcec08b91d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfccd38b3855deb05378ca61ea426bcf1b8e0aa8a04f5b1bb6c6ad425488229d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cadfb6a43d23ad349393709d7a4e6f987cc972c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fddb5d294dbeda271b825cda52202a5c77153f933e0118fcfa0cb53775cb2d8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..951dbc721871defead1e665dca3ee1f7cb64c622 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc7dc98e2116f5bbfd356cba8b431c1900623a7b7f2af884a6ee399c60170f8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b96f743416f956e472de22c86b49356879178188 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60f9dc7456f2448627ae029156fb320b3bb0a8b6c8f3f7cd4cc4d2c3684d733 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b8b027d4e792b467c3fecb3b8f27ada572a2ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e572e20b4d3c3b52648273f2c12bec23dc8e72e20e1690cc6b355ca9f610c61c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..890162575e90d984e82518fb2cb12d92f492cf32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aafa43942047bdaa8227ce76438feb1e1897fe6db67198472170fb93563ee04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..674727d9f546285e9ac8a473dd280f862cce2b2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1314cdb65f2617f7dc4885be37d5c51cdf57e2d7216ef62989a27ef356204171 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13015d6a985d048f817f2f89edfa191d3d6c8845 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997c7f4d263fd85665ca41715b31d879d74bdad063afc88673c4f6e3a45e9df2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf53e419f6476681f50898e6d3514df30312c33f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78df400d7b16cfb77edceebc47cda070b5bce08c018694ed5b40a660b40adc36 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..652a8555938ee72a106328f3e502a6b96942defb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0109293d40a3312ffe30d8e536f8d15b380e6093553546a1a6f28f222b1952f6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7649755239fcef741d5487b3e89168e0e1d3818 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21ff6af70b03a568654be74ccefe851dcb603685302696028a3a29cadf2af54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5aa562cf513d7453e1706484e964db0397d585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb70766cd9eef9899d1f5766a41db320b04e87eed450f3f84a31fff323dd71c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02fafcec44e1bd9684c4c7b0b095faaaa92dfb26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f66f51a7006841cb196dc9e4d85b1e7837aeea39021cda3e03a2f9d59c75c98e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9bf6961b97fab2d43dd76007fa568299914cf77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f9495bf9b316abb6d78d9d82feafdd5bd278f233f8773d8ec88a9b988b8a6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f9f1a71c98a0e1e069fca7ec7cafa57f0f8f66 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d794c860f4878c0db44945433081c6446bf73e9a8c661a892e9a430a72f500d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a610030de66af6e239cf05ef2607716690412a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eeaa54d0534fd3197a35db01fca76aeedd7d8c880996441e64de0ed7b0eec20 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f80f514117c6525b1911c6c84ca2c159a84724 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef540c2788b3305c9b231117a46734a96c800d7721795ddfde0d57eaf1bdd7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..527fe73635f1f691187779782c15a129db6980ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7dfc58e0e362d6e83e55c880e80b1c0cd3f5535f155fd11b45c0dac93ee7d75 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e9f90176399aab4f60b32a7f6d71475d6c5b87e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e64485839ed330dc766e24fb99437e20fa37dea704b8adc7e724337c3ee1f48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c728135ec13d540f5742ed8fa98de4d06d65375 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526fd26ba38783ff50c8e40c3ffe1646d8affe1f4bb56fbf5661a8fd6639e605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fe14f2c69f1ca49206a207f6bbc1d833d945ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6885f2062f48a2fac0d66529beac101247e6d1163f5e1ee33f6e064a099c5b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad7e57e13714a33f2fd297af3464844eba57c559 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835625b2cdefb818350d84aaad29cfc34be9df03ae732a1a9336d295b295e0ef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8447aba28f1e4ce3d3fcf6ecd5109e22073c68b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d15c4989f2abd64e57a63c2d9a2ec7dba6520c74e23c9832cb8ca6acec2e2a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4027277919ce09da30057f0ec759806d76d6e030 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c501ee81e29fd4f3754e0b1660f78fb603bb638c689fe928b56dc3ef624b1064 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa801c1bb163afd28bf0b5f51b4137c715f135d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27cb315fd9a317b363963cc1a9048766713adc613eb267363a1893c74217c6eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..950cc2b58929f7e44f19e0ef5fdc9915b1d5c01d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0272ba67cf460ebc4edde2ce7b8b2604e50ff87830daa5e826b88a8cf6fa872e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ba50d53f5e58746189bb4e9683ebd774c2686b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c344b723bc6686839cadc079f7a837deb5b07da6f0467af3e99c0d28fcf65c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbe3297f9ff60f4bbabfcddd60025e5f8e85785 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f560e388987f77dace1abfc5d48a4d5566274e654ac854aa1e2b4c9bd066cf77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be39d5f1dc01fd4dbe6bd4a77dc594b51dce491 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bdf96454b5a5e82dc099875af367b8007ecdae455f10232c76d828b284bf1c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..920e1e872be6b4cf325242b74dcefa2209182908 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aedef0789c577a8c26def7a24144de99317c2d7a463610f96da0e3208f99145 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5bb77857f791aaefe86acfa0ba1b402a322f310 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b6a6e96b256ac67fb6e988812408e1a3e9114a4846e670cfea6f6081ef9ca97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cf8cab3311072b14012e1b03a3bcc6d7f35471f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206cd56355b3432443a2b911165a20167463fcdebeaf7252d55c87d9c69c3cce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb89130d57f919030af5c07da6ae5ee3851e52f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192386f1d231c9f635fdf2a00b900ae64111d87f8278931f6f834b4f2f1c45ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d258630fee7b6584250e212a3189dcbf5a00beb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6382f20dd51f6e1d6da6ffb10b10608dcca7411427fec407d9d03ea0eb743977 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d4e31d31fe0c2efa603504362b71ea8b7ba1b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd21663be03d8109b72a0a6a15af185bc4285df59e048ed6582ec55dc2d2216 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6804870fe916b6e8daf869c5c284074485921dfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d3772d1cc59905434533ea38c9f7068ccdf24ce987ddc8e00f417a3cfba4fec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8877442c2d53019c6ab098ca7f23f43b10555ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42e162a32bc08078de13bbecd290fc77d464ecb8ef7c6ce823482ae8d3c5da0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..560e27104604fa3617b6b5acd29f9165c01de62f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfad6550513148163f7af617d1434a0718cec192473048f6fd4dd179ce8dfae5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad63ace83a7e5f56f742645ebd54a5a01d69ab41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd58279bded5e262273f24c13b4dc5a9bbab4fb34d2a3c9880321fdb95631a77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28c7431acfd02c76409bec450f3818f214bdc01 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21ec0ea3d34d60ef62af5bb6c79ae739757d1b9e7adc25a8ae299173bf82e66 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e426d0777bc476f755fe7b9aa2b7d90eac2b563 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9027b9999db439b4b2702bae5b490e161416b592067ceb3ca11d48e5c00aaf43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ec7d678d52c82a3af01b6631fda7ef292937be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a547c64aeaa1d5cd74e31cbe8f6be3b63655bf0f2877d1e0311627fcf678f25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1dc3695086dc5219fbcea29d82758ae5b639d4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad3647a8e8da2dc7d4b247e68c052f8b2f51d6626dad390cd632dbf9bf82330 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ea56ac0a9a4d0dfca1ec17ad670ff4d73c84c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4350182f48a7224b35572fe204095cc8ae418044f536e36a10cd0c4486c228a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce248cdce848abed52851f8651289354c68f75d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718713cbd4c50f47cfefb2f06c7023514b16e0f45016305d8475417c847fcbac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5971f283c96768c158c5c7a37b2c14888fa3396e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37e1a69dc966ac0202c5f11f031ae71861df400ac3501a8f98005ffe9dfba27 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f90fd48f0a87f68754f0f753d8c4ee25251fcc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ae144ce8dfad59d19467adc2ac9de40a0ecbf1b35a6772340e6685d53fb6b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1e4eb08eed0e1704f49197f99829b8745921e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fd1b5915425637d3008a1322eeed08b4ca6fd60ed41e0986bb489b1e56e2e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16ed0739175692f038b65831e5e7692f43e9e820 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7793a4bd5730f7d0c95e31ba1a55ff42197240062fa089c337abd3226fc86f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee973dbe822893f847334e55e6674f928fcd2df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9b6d1f77a9114a1eed109f235c351883ae7602ebb091e184c9584fca040b90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e70eb6b690ef1ddc5f4f6e7e1f910c581993eeb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62fe5a41dd0f7b89ebd8fbaf3a1c728ac231e7b0d28dca08d0715c230f31b0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3637974bf2ffbddeb55f44d022dd0cf673a7f649 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff3c67a99d6bcbb2d414014efd7509e9dbd75f777993e1f14b8cda7b9156ab4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e73479d21b0879b44584dd9a11bae1f047bbcbdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eec16c2b28bcaa9c1c0b74e443672f674d3d741a35f58ea010bb408a17c8547 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7dd400025235eb03fe5ba5718eb2e133c959a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95034cb31be12f508dbcf9b73e592ddbb6c0b86493a222b5fdf48e1e567436e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca9cce7fc77f37c17c3f1f1c44b47946c1700288 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7925397ad2d4a27ac80de43f34e3ef115a1cdbe201f45807408fa76c5131bd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef79875a71fa570820147a8f00d8f62562cdc3c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239354f271310d25fd807a84b7434385dd95558934684b2aad3d455802e047b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3fb8dcbff66c8e6d63585c0830c33929b4c287d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5ad4f8a91c898cdb4fb4519dd0f5ef86e04230c2f96ccc84321e2d11d082e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41648d09da86f55a191852722d7b2f25f416cf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e78dbd9438e7640cd3083b6ca403ce32a0c403edeeda0e602c77be5c9f5e5f0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26087225a46b07f2c71ceb8aedc10091c3f5b5ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850b4609a14f79df0357221cee310a1a853f8c9d54d52f26b20ba4da9082ed6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf4b478f956f95b82cefb3a0aa66d425a54fd60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd54983f38e338ef858897cc60c77bf33129b0c7b6fc095abf5a92d322a9e3e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51e620983bf98527fc46f7a2841ce3085b371c78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ef8b57d5f0afee172c3c69a7fe142432980931620b6ca112bd6724c1e74619 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15a55befe321de8dedbb53012120c85811cf524 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2323a6dc8c034dc934a726e60c239125008f6f3ccd7b6f2d6f0bf87b4c1ecda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2538984566b2ac68ba070c996846a945d290bcd0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1899e8a6f3d2fd142bba7e18798f7f15b126af5c8a3e8e42ba8c24372f0b37af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85680d7987db488bb42e82243e7a49c9d214d886 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee19869372592ef6a9a60868a89ce6b3d0a038eb17056f5efde70c2f87bb3fe0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5de79605ce5acab9dff0b7ed81852f51ae68515e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1aa951d5e867564aa76005759c9b2c67b9b56e48c29f23f9644e6187a15e07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92d1c92fba3347c5b87aff3add691c443539fe87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c9dad96bd7df0d4b551cfe49ced18b45f8835728dd4d9aefaab35c680e79f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d7c6a32229a9f76faeb552fc3b1a22fbc44380c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186df639255eb05a2311125d1b752c1869f841c6af9e2911bba0d980ac9387e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bdde671cd606e8d5e4602ee57f4425729319c58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9ea0ecc8fece76066cfae35376f7f8f55c1dd050f6ff9794ac440a3174b65d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ee9ebbb3234228f701446d677be522c7f8920d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13510cf3c5e1c5bdb5270f329cf5632369e39a7370b6ed4f7635700eb462bed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b881ed829ce938f5a863f8f0f52a46448dbcc4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40e0b5d28e66b5a0bc650113d6d7334d09ab473e5de07ff77542725d97faa43 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8caabba6eb89c45ece12e0d1b94e7e5598e1d27d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1cc212d663e0942710168c584790067fd2482e65bd1618f3c04ca7e3c7e8f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86109c6f0e5fd33704f0f44c1d922aae3a0692ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5e31a68980ea0f7a47d3b63cb78e1b1c4d0ed67b09e602e2775ff0bea74a0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..248cf92c806cc073f4788e1871dc48b906c5fa61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5616f3f72c8be35feef4129cf9ec865fae15aee8d2348b26bf966802c9f8d17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..999ac4d412a0457bfbeb553d7427659f6588e764 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b637a46fbc33b6d29569dc7f726cd4cbe33b06b193a974079db320298454b81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffdfc6923a94e5e272cc3e6b633233431c0b26ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c478d61492d9b1bb54b179098b9ff5802c4a080b7a714bede47e62b3971fc8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..809b8e075bd6a3eefb11b9b67bcbc645d4cb3280 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32174237e0eefe5e7d6b2e24de5363dbef0f3007cb04a9144e678c48cb5e34e8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..816d203d99c04234d810a8ec3858da7cff93fdc1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c54cff89cec6a553cfbc563acc2193f3b01724c1939a6f6d6a23bcb6aae42d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c670537eb6b9f7f0bf16cfbfbb041b6ccf4e2498 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3486eade929c2d95ee0b5973eb1f0181b0cf3bdb308369c1767464947039856 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ddf454f9fcb13488b98791eb2800973f84c4dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3af19e0c2ba44bd4c2d4b86488baeb66848fc4d021c1c0e7393295f6f0535d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a708388052f05bfc7f30f4e55688caa828d0097 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39ce13e8464772b7f1040b0fd11c78cc1aa4b822a316bbd7dcc373e95d932d32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df233f7da901b5819853d15969670e7ef707ccf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c66ff5696fa6c1c0026d311a342cd001abacd7c239fa3bfbcd07374120b169 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed6c357f73fbd49d394aaf60ccad552ed06a599a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:787e324cec0b3a497244d444f071e53619efca18ad251d9c0eb682ddb8c38cae +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b63f8310da64cbcd14f01637370315b420f7449 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07777b2d25b14b9baf0fd54d1540910094909fd66b97604afceba9b49f42f6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e1dfbe01c98a6a8616c463f953cd425f5cfe1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4de6bbdfe5740a39529188c94392ea07a8855bedcd31ac4aa30d1e29c30a2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de62ed31e54f8c95c5b3b18c54de5768930d8ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07931f2a05d94e740f1c6449e182b9f716b52f71e7aefb988f279d8676618b93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f95ed73378b0d1e1c3c5d51d66fdec3e502d80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32aa076fce4397a241057d9ac3b0ac816759ade39607d2b0e5c30bc3493ad633 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..340e51bd2c83e0edb64b40afb6f9e06ebba7363a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c469929d3f009b89504b2297f2c795b8b210d482e501df6f213643052653fce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..306ba6e1c3e594cf4a1f2c0318c90c6880509f90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ab74d386300a2a67d6271313d0b89f0af73efdf7ea56af366a2c9d21f44c83 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08166eb8c07938b30e2d56a2f0c388b9f6ab8685 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777b99d6b892c196d84e9be783aaeb8d826225f2c2946919e74c38fe11b0aa29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7cdd194558c0973376d92955f24d43527ca15c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aff9ef2f5068848fd7bc1c793d2fabe191eeb98c624322f43f9524219c14e01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb0f760c3401a2dc3252dbd4f0edac4f4b67e409 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948497c714d51533c51540a7a1f4d76427ed5c45d5d6b45aba72d1c03a331252 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a02b4d055589e938b4d429c695e4764527fc4c4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c415ff1b523825ba810db44490d2327f22fa86e3537e445c53bba067602f7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..998a2263a7bc70eab0eeb0ae689ee6e83f4d47af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf81532e43b8d00c4bbdc68037199895190511428ee54e2990f455fac22ef24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9a1bc493b1aa6634a8dc13963064704cd945fe2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:008f78597fe34afafff480322ee1681802c7411fd01c2057c119548da14189fd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0353778a4969fdac9d1cdf09ee70d9b7ae0e3f42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a445430774b46c403698ba90bf3c09145ca134eb1815d49ae8ca286027fb88aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3980f4d9cdf9302bb74f40891d76b826dbe893d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8e2e23dc39666a61a083d5a75f47a18481772abfad3075517e694c5245c9fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a17458af8f184c1e3f030dc1dd742be642674c67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05cc9379992bb0c584d76cd1cc01ad90f7df9b0822d3134588bf8d007d977eda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55991b8514aa0378729f427fcfd0a254d2135718 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c943534f17dea2f48194f246dddea59f2fe94e0e6a3181912ba7fd22293d1097 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..716f1f14e8bcd1f691346d02c6c866b0072534c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0909b9539f8d81bd8ead84fd8f0d3e1fff55f7313ed2764ad34c8ce6b581496e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d426b6e2a1412615fe64ccd4006fa1643323e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f039c63e4bd61150d610b6cce37d8b302a3a23f82c547e19b8125c5bef398f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e6c3aeac4b2df650e19c6ef1bf713961b4d71bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64987e9d557958bcdbb54d1e83abe2cddca01ecb53f52a7b2e93c7735f4693ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba11782a0e702df037dcd9c084537ecde3d95b65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb56e3969edb3b9d8d617c2ee3a2fdf59923ee6249eb40465bb12d320d7ba919 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..375cac7375e555cebb32a8b8eaebff0e22f7966b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95c7a571ef8e7946e2ae22e97357c5c3d7f6f789d042dcc22ae9b5232b5c023 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e00fa73c51a8269b83841ab91be6c3e3cecbe52a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8984f9fc3df265babef3a9b3c30a4d710904c0ce47115b084935e3a39da9807f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d2896fd0d16688d5bc99a2cd1cdda12e83f4a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b6e1fb45338b60c7d5e5dd74d277001e1d06aa8e96475c95d66ff73e53d27a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be9ddfd5db12dadaa8d1a1a370dc999fbfddf52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c874b55acaf2f63e3531e7de1bbaf41628bfc172b8dd942e342e6e6d5dd7dd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f776b8e991c847b7f2449e0af6836886d45aa518 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6fca7b6ff273c12d911888afe588312e3a351d3b167b88958afc2f11092b1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ec0ed325891ac625fdf682258636c92db4c906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936a87173295361e9f445f074230783ca072e307e2b905dd27073c1dbcf9dcd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99aa73ce3adcb3505f3a6a40b3fad7291e25bb6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f798808ec02902b7723bd8318c0116144195085510eba80a43c05616dc05876 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6044078ea26c1216029d5121020efec216a55b6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a67720d81f03d8f2893774708da2ec95565f12810dab90cf191291041bc400d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..671675ab53d3cf79187a7e997f4927e5b39a0016 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699e208a667af6d0a38e8d3ac0682e758df4695cc2b97197b330ad931e93e0df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b00f3079d8c4051cc79b149f128b71d989fc903b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56de9a84f63ba340054ac01970cb9e2b27f58f20f0562de84bc93a18754773d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2089e8c1bb3d47a93162a8b0f63b393c37957a2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34d307017d9789d5f45195d245ff1ea3dc99b604cd653b0ad6ef97bcf2a47e83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f3232baddcb787a0035e2ab3c14496130e83113 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f123a4bf8db60d9338658cc510e18893bb011814cafd9784d242e50f7ebec81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f93744cf0425db4a44e2e0c8fdee8b5418b0454 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0319ea2cc8dda11977adc47cbe4bb374d469512c0e50a2333388cc2b20f68d1f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e535cae7f427278a633023a77b606a4a98067b83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:647f26be036316059384b01fa797d4babfed7fbd5c4ba5e9ce275552e9815602 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5113e8a263c70de478b875c8b326ce9b196f8462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6e8edf94b1c8a29fdca67b63a1a97fcc82d0b0fecc34c47c14e60a5ea78085 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c30384dcf7ab91511bf54dcbbc8c4dae087d8c7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d6d00edb92781ee144a24b7cfc5f10e775b5e2914fd3e1969b1d30a3f1d4d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f29410c716760ac56a9e30ba9534f35b7ea4db4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0980306246c4eca7923889264c5e236e81bf908f03d771198603c8fda7fa9ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0979f0b463a8866315bae491d5a0c23bdd2cebdd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d147abd24005bdcbb4b91ca9c6fc8e93cebd322a97d3b46219d05627dfe42ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7b71b0f8c43ede9ad0851b242c4d5c3320287a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a6d6298c0c82074d8385094f948d21a6c9a8f0806cba39cc1fe5cc1d519205 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d3029c49f2c9fea0b3ff70eae3175eb8a4318e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8019932e1780958bdeb4808cc6acc316941b0607a5cac7ece99aef80899e6718 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e19765fb5d8ffcc8d668eb856523c697b830ba8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:469855faea5bbae171652ae5f806b23421ccbd76115c5c08e217aac3abef4c1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd61f81938f04656e3b56be2108b66e5d343e7d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332283a5b2fc6dd5f265b22d95c0b0955c3ffe127c62ec76694db34563afed98 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0692d8b601b5d591eb6782b235643a845dd43b48 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe4d83d7e13ddbc635b3ecce86e8c802b662d173c3b125e85ece03881ea75e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb35f0b5055041bd1898ada421bdff342d856ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aecf54937656d8c9ea9133eeeee6a7b876f913d5d2188b4decaa90302f51e73e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da28ce7bce74ab018e404f56510fd2e1f51dc436 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98df43c44199414a8ea47b4472eb18c4c77f098dcace2ee924141502b3dc837 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a15bbd0be7886cba597032ba2b186df813710a7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5454ba70cbeec1313d29bae38f536ce875b9232115b3f7a6e33027bbad410dcc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acfd8236d3455ab19cab25bbf3824086c6ed89e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7280455cb4d256052e62d5f97d66f3b2b1426eb92448fbf7111b4080f22198a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16860ca9c97c154e8767fa31adb2a0f9e64c76eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069b924a885d659ce5deb7c1e0d2caab0f4f2ed6fb9d08e10725bcf31b9baacf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe415c7812f33f9bd5cc08eed8fc0fdbf0a3843d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c366babd6b5869a907385f6607aedc4a15adcee7ed4b92e5a72cb6461312ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..495a0c73e2f54243b36dba02d64b8ef7eb7e9bdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f8bb71763d801ec9b92af5b24e62c477701facae08b76ea574ecc55986bad8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5222a91bd44e4a8e6c81917a3c90ecfdf6625342 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff541649161997d266f76d5b05a35ebc9ba0ef8137d573d180185c03df81fe9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..476ce221cb3a818b0fb5244ad505ac6e93d777ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b768c3dde8bdc18ffe73f5362ab5ab63d72b2494da9c4b429a826b8a927ad9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69aee2e740d6dd52ad9bfa7c138ba386e913d7c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74cf3bf51353170a2ccbafb9f5a6e62b65c99434ca328f298fe0ac0ddab37a2d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a6e891289a329d91547870207d93a5e3a01f6a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2161b717f8f6bc0e6891fe6b28905cb35a366495d9f724f71791552dfaff07 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24a6a592c20d97515e069dd8ee6bd5247f011c9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8031507e804bd3c2c2a990f16977274ddfec48251e24d21c5a702ca704c58bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6882f0684d4fe480676d5e4095b1fc684ad184fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485791dcaa55225af8b34b17b68d8e62577973226a2bec4358048d4c10949856 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55326139677e4e7201634c71dac9de35020b3f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9817d2404fe4042f5b006ca9dbc0c2ad94f03cb56bbe664ebf29aeeac7b8b010 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab497e345193b3f5d9d96bd0c226e5c4a4f32c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57d090ea9d868ef8370bae839dc6d7cc37b127384bf06bf2d33de3264cca52d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e9fef4691e7c38a058bd1a21520c8da73c9e6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:807d059cd6dff6b2bb8aa213aefe9f9dca11c06f2a60319bb834109c3c08baf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1351aafb197698c17cc72ec9d8da19bd603c2b8f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5162dc3a618104a678e511d9ca91a329a9b461e79e4e96da4dd1896fa9c37db3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0699616be4f5e5d7e614e42fab6721974a15c619 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1b42e169a293f617e90a697dbdf1c8c1a2a159398c650d6335bd44226107b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b46237b5622cf9aeb62c4d532d6b825d0833d08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f216d03f3673abb01d9a04a6f8834586011de509f17570f9b6b0113308cff90d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c8d049e6dbfc979bf6e54d2ea2d1b2b23f6259 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24113ccb9995502a5ac220c18305534ad0320d64ac80137d95d075bea6720aee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db87b94371bb17a4be6af79dd41280de59796d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba90343d6a8fa295ba1e300c60ebc7855e0463a6c9c583701160fe0a9633faa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63519db9c63c5096e52661e26b780c34e285b458 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545ae48e249f81b0254281be22945bab8705c4bd8724adc9dcf81f776ca9a162 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f32081aa4d91baa48dd8582c7f227b908fc4c89b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3906b4304ed9d3f1114a9eb439c59a0eb4c982019347ff4216a68c6a1d309fa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f867e589eee2f43e3a28c1faeef92b32e576fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48d89174659bf872e0f3f53ed9cc57294faadcd36dc9ab98b80046e23783776 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b8f184d6210cca057316d6faa8f99b965e3e011 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39f4e2a9a89c3fbde6a5f1e7eb178ceff2016e6624e43a6fdc603a57b25ab9a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c5569efae0b801734f0f8bfaa00c059f83a690 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67b48e50ce979cef5fb24789787d5b6af5079956fcb72444167aae12eefadda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d7c49b36eb6365546d43383b3511848d65b7a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751cc938b792f5b15f60b3a19bfc917627a95fc9dff2024a63512c761c145c4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a29a81da3ea77f8e2374cff9bf16770b4b2b3a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e2ded03ad7e62b0413a21e94310722ff5cb6f01bf74995faf13eb975e77728 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a445c7eb4aff6494f21da44c5b749317899ce1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02cda5a8eb8d3f64c1004f35df099f98c33cd73ef6f3e9a1b85669faf0e2ed08 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb26bf98d84ed44bb20918e43ca6af891c35a09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89137c4c0f3ec5058b20f665a7ec8607f0def429cb9b20d3bd7d1c564609bef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29f2e07ab3bc6ad963da415349c1afee96f2a52c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9980bfc7f31ae5924314d2e2f7953912b3c30d085c976950004464062b35e25b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4753fc5372ff9a9d321f4df00583f3a66e52bc4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:519af7af9e508202ad2a348b809d8370800d1b4504ccc4543e8e7564ff87a9e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aa355a3641d2d3629570d8c0e1faa21ad97f120 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b674b46c7f17f64cfbaaa2242de454411f4181fb8dfffd67c1957de950e9e92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76762915b0928d4b1b883e92b0a0b09ab9fce7c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7dfb0dc4a263a63c7ee96f71aa1c747c8d3fa6787093bc06032bb2c36aa0ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1caeeb4fbefc23063dc4de34daf69e7f80b55bb1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4929cab6272e169bbc5a3d0e9be1bdb615218adb6a6894f705db9f28e67fb00e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a77667d5a2483b3e8f08886c14dcf7ca11d0d62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b454de9cba6efc6ccbe39e510f914abec65dc4450430430e1e733b069c9e8a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2883d980a94ed6477dbc51ae0070b1bdab95a8a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43500be530a73f1f37c96ddb701a73a66d4a174def6056d4b6e2a2af19460d31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4104de962cfde167b3df39b73c7d358e745cf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bc82ec3c6e5260b425a7321c406fe4150b8d0e2cda53cd7564db2b8482e99f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a979cc2f02848c0d20f0f2ff078412f27c48a0c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef7e6e33c638d22990a2e99c617c54bd462658c305f48e0c16ee7bdd217247b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb0120843374417f742e52c394b9378846306b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60468d639a3963523c8e32eaf7bf2434e1aa18bfb3b0ac4874ea4b2351579186 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f1a8d1955850797518b6c351201a001c059c94a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9cb5733402604029a37b4dde1d92ac2a92bb28cf7693ac065c1580a69058ad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..105eecab9b7548747efd06fcc760b09f49b28f59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e962ce6caa1a7404f5411fee07e274515d86b8dc93069a6bbed1e6d128b0e9d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84f7fca45946fc0c2a94aec9851d595982566581 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d8ef72931c0637cc591c4afd06ec137078e4b436055b0dd537d8f2ade825d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d5147891d3ef6ddae6b33820f598b65b44f3cb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c0f8e97fa99ccebe5099201065f9df202a0c409cae55bb9c0b6ca0ce57e89f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0089c94edc615de01401e0d6b6741371b13109e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d993b2a05224e1cebd5e73e8dac6f4c2f51df3a6307ee87e3ee6a972c566d9f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1155fe3b9508590fcf51037b913c873d7ad6ccca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac126521caeb46bf914bea883d24af2a0af35661671e5af2bca9d41bb785369f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b94eadf3b5525ec0febf4f26f68b6cad46c237a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8efe5f5725c41b7ed3324005b6a47664f56c0f93f792ced1ac3e5a6e85e0b9e2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63e13b89195bc6c9bad06380e2e1fca79a474213 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57e99e3e8079880ffccfdfc87f818621cc9f7ad0031f41bbfdea63e04d79fe8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09d1db74457c3d91d13d5df589042e8128a0186 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86dd2d8ef8a035845bcca423c0e4c8ae505b1503a2112901fee78cf46dbcbaf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d109ea7c3be5e9c6536ab75866a9f8c0cb540d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7052ca37c96fa6d8506a48d659311123fac96bdc48308a7e46b17d9ba9c6c205 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2c62a35032050e5710f9c59aea9a871b269435 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef178046b0fcf47062fdb89eb2334f558dc13c41889b19635998e5fb64904a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b7bc796617a52158f40f206c94fd01a0e2c9d85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756881462a171d970fd73fb766df0e418c64060e1d8ce0ee293d5a94cbc17867 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d34c4548d94ce4c17059a0b8ba7f5e65ebeb45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702d6c90bd1f9903b9d7d9e0363d9c17d792e133e3bbbbbebd479c78209fbca6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd47277708295af4750578c30bc4ea22b5eb9a7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb78c9ab90e2d4d930f771365c959534afc0e89c67e5b1d771442b342c67ce86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00bbac5b0d445f47a101158cf42b4599ce34076b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd14bdfa452548b733e0edb9c1e11efdb36ad42671278b1b80c86d82e7b3d2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00c451a6cadd1afb665f51d9135d6eced806948 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1251ef44905650fb9b931825678279ad75673967116bec9871d8adacf636a832 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c1181ddcfb28b3305eeb2b4ade6523738f4c03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a4cb62e38504c98ac93474c1eb08cb85e3bb31474781389b32869fb2f0bd2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b806eedc9deb02a74f909b739826e9adf30f4f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7cf32cf6d9eb83a231e7c7cfb282acb7c86c3a799d4413833c0858ee32f4a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06127fc9f8a704ed9f9f421174a8b22bef5ae3a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6bd4b1bc25b2d1047c4a687cc678ca190f10b8f6157cc037538d2e04b5080a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..729773cd691a4de4545f590511675ef91db13be6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd768f48e6f5e538a8694cf7e4223cbb1f50bb48ba0b957f8c2ce929e8d4c352 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6114807aaccf5d92b7a3bed5d756cef60f457277 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b5d2c7f70b908e11b53143b775159ca7c2a73493be47e639ce74d359cf3659 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f44a5d89cb27631c1c945a0f6d9c00baec62df8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783b0af8f18dca968705d6426a6ca9913283dc4884fcc2b16e967964d198cbe8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fb538bc030761e7611f22601f75c09e7d984026 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faee703c0db6cadfa9b419636d336a6871215ea04c98ab2f5a74fea58fdc5e38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b655dcd270da0025cce39a080529ea0f8812c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c148bc299360edb0128c5e19749c7c12e670a6de9efefea074aa65179a62e676 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a598fcb9312a58332ca47f2e8e08dbaf328f344c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ac81166a7b7a3f54fed4d0b200ed59250cd0544b20565f0fc9dc9e5f04b8b8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f613785033d8424800e2a97c622678ba19f0b2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d470ad3f15b0ab6f9f32385b739f6e1b7d4295e387821f175900aa5d77d55823 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20a84d420fe8c64326625c9aef1330616bd88295 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f27de98416c61623f573f712882cfc76bce267acf22c8259f055f63674a832b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a88aedd06146c8945249b6f622ef39031ab6573e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258a571232368455c158440312e1e34c5602a8ca4486429085b1806de48246a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6222e2851cdf4ff05e64110cfd9a9da324aed6f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08c7c545fc736ef0a6c4e9e6046a9532716fd85ad763bf5789815b9d4dc5889 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df72126770c34172f2cdc84a0c36ca68794d145 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aed91c27288029304d491c52b168169c1fb8456bc702b4e0561e93844dea392 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4036158cdcd08e0a3955ee7699f7cc9579e46a04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:484ee4d4cf67aeb4b9aad0abd81becb2ba414e7c5f854a27558552e6abdd1d51 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..988b3801cf1a087102fa8e832c7d8d1e60af52a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d966297e985b63907acd04c9800ab35ff1c7a6177aca7a8e7896c9238de4c60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbac2a3bb0759290ef21f0edfe01b9bd7e99318d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59af35c6450b0756a012ce8b4ea44ed4222f89b6abf56a7198681699328836d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5300ffcd4466524c65cde17cb8285df2555f1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19bf3903f4c472b0f098c0e6365089a4e62a0621e853bb69832d3beec9188e5d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc76b01491ade4a6a83d506c826a35a9c84b492 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1948b5ac3aa72bb3e2cb81455175f2f4ccbdccfb4703938ba19d0f03ccc1827 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c80713f7bc43b6671141b0d90b476148f3433e5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3203714e886f026d939a548815381f1ebad8674c0a47b1aa3dc18796d62ba6fd +size 11395