diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab81720e595d71893531554618472f8eaa44e38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95975d69864c0c13d5025763158efd1d28b7bce1ed807960845adc57478316f8 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b37d6b43cc80411dea26e01d1f75493fa52b83a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe5f9012c94b6166f786eb3218c7d2edc1669864a69915ff3122d5c749e8e84 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d4c6e7eb7a3cca198ff161c8c91edd1647d5830 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294f6cf49e5dd29a2cd0eaedc4b2ec8cbe7e5934048656db08986f0314c04d9c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd18b7a631680309f684ce67e190ccff2a3dba3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c7a0b1c0b2fbfa48f76e5ecbd155ccc147f6bf4547a887a89fbb2e9a252e47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53371a0089d933c02cab4fc47a79630ece3701be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448121e9a5d752e5fe355cafaacf461480aa3928c224a12067db9720415b0bd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c7f70829eb6e6960b6c559943ffd90d4e125575 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd23b1298aa4d7f14e58b84b2391c4afb8e5a704bd4170c896e5bb2ebfd8327 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e85e5d4f7d3460aa777917fe1ba5dfdb1080d42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfe15eccefe7242ef9713073fa9bd9da215d72bacb6ffc3f01817c112326dc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..606e13b87ea91d01ce7318bacee9391fe5ca8d9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a630542b2a48e823a3fc919357854ba7bb375e56561542036be3164c876f306a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2373af5f18439893a4a2e7e132baa851fc2d4a33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f3fb4838c49bab8a61bd77de44522d92a068c97688dc3b51fef019b50c74de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cdd40327f00c6ad50a92b4d25354945d0df59fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748a6b1fc71e33e082c2e2453f21875e4889a7a460763a46b80fb9cbb974a866 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51cb910dcf91a69a3624b4bf3264b7f5b6ac951 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc0a414fad39ca74b69adf66980ebda76d38bc016086a69c4fae0ee17c2750c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6684e552b0ab12fd17fe4eccb25a0980996c1335 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509ccb7d1a3cf9ab1c0e749a5cce46ad7281450fc2e2b1a6d678214e9591f9b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed8a5e8b3fdeb6d5bf85a38aeb5017833e4bdbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a8d6ce5baa096a419be81205d96e65ea854985362178b8f5a367f02188c96f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a17dbf01f81eee955de5aedeb0b7e930f987e0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c268ae5b1f30eea0380ac5e240ff171b270c649274a683ef18042243d941c6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e33d2fd52e6a947c3b0900b3134c19dc57a0fa7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cedf795fed859165dbbc39f6e6f234a80a15302418ecf8e69f736b469cfc5c23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a271cb49043351cc00ba62946013cf94f18b6df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e1acb0e63bcfaaa92a351cc01631dd1c6959b8ba57f5afa1ac612300c8763e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2928aeba3fa7ccfa8267453cdbe62130428a409c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8a492c3171302621999877a6c78fc2bf54ec58d6a1e9c504e072986400ebe5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f639d4bd81ac7498277376bb95a76146f193b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8967cfa53d03379543e8775a080f12dfab120a9eff8339db57002ae69523c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f5f4d582892333065fec03c27e0330e2d95576 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65addde48c2b5a797921f294c9f7faab6d09f344b6ce706f0f9bae440236ef2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bef87357a6fa24b8a24425b3502ae95fe7073ae7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4e7ae19524739c9fde970373e67c084bc9892e9f97c91fdd29fadb352235099 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..168896137d2ce2e82545f103886de014b1158cb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48609535525353b10480a5817fadce1491adef2be4c0fe5a728c781fcb40c7f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e512d9ceb1d1f2a46938447782a91ad85326126b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd06480318cd8f6ad441336588661974fc2f305a6bc36ad92de010073b5cbcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0492482077123f43891b5a2e61c0b363f79ce4be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11092fefe77a8ba30d8f13ccfcb7b27f94e02b6a12d15cf39b545d7f822188a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30cb83fe41a238e58bc680e910f8e74d79fb2e44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8450ed235eaf710373794f8b8494ffd2adf60baf4b06696cd82f3c46e5ed0a63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1224e5b5f132a931ca4df1268354ab4dc6cd1539 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d55a502bd0168b8c642c0ea6e279347d5c205d185c1cd02f18b4c3cb6cdc09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c748e77eda17895eb830cba042a71723291f11fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd65d592603d5d214b68def5f05b79ff2d233d2035e5df3051d7f24de3fc5e4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d3729016ea76f96813eb19da8b0bd267ec90015 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2a2823e50701000d730b8113e5648e98983318e4d970d50c7a3801f6fab241 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab275e0d2a4582fd661d2f71886e978a4d9e8677 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4899adc189eab9da03d90dda48ec4a0b6a0944d111cf179641b43e3ab98929 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99cd0c54aaf3228dacbd69d994a6ac71ec0506c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa565e2c83c846bb1b813af32a10496c8b3d19f9c25a147b7bd7f747784e097 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efffd32da9f533de298c8d889797ed39dd1fcce5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c7a76ff6b1ae692297b9c2c82555ab2e0a02c9d407bf1eb833f42d052cc76b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da001a53c77c0ed008c5339204dd215016a9684f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a0b574eb9ce35c175bf4b6736a8e8e8a26f96462c4d413a131d64f2a267463 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eee0ab6983bf551f5475dd4b865a18c1cee5c0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b553d82053886967ddea45ac3f58e3bb3954e8d8ab27fb9bd3639d45b39eff +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3706c56349c25fe9d7bf22c4230f6525e94a83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a688de95baf5ce1190ee1d062d1edb97d5f964b6081ed37be4db4ac5e397741d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a6bb0ec0520bbec2e4fc2a4223d2bb15c84dc87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7415bfdd74f548d38b73706e10f04af26756b9a03f0ada2616069ba5519407d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9128a3c197604f22941275dbcedeb65fdd0b4ff5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc591411e9805386694ba1c3ecef8bea15c26c3c1053c2802740bc8c8c9a968 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f57fa2eebf002d8cd39c940cf28ee490fb15520 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169682deb38182e64b963960da05c4f7dd449af548515bd8405bed855f9a98bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e55031dd5fec72b44a1e8de46f1ee644140185 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a698c0795e4b9986dbc0a906525339267e01c5ede908874897cc21ee45e8dca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bca7479b15c46128bdf19e5e79975403192f3d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3164c3b5aec4284a4e3a27d2563a67a905534617ed7722e496e11a2fe15117d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d1afd7c6f8e809fc8f5d1d7bd3a0e07bfb8008f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98508c771fa235a930ec21be149520e57c94cea43d4d4f98a46609f3a5da5e48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d6482af052c0832eb0f9d2790ec261ee9e0502 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98ea3b2b4395ab3d726dbb6c8b3d038808cd5315ac060f79ec106e42bfe408e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ebe4b302d5bae53f2264a3d26df0fd36055650 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa06619fe82dae262bc1e7448be8abfe4d1067be0509346b2ae13c44d8c3c10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..949494dbb09db04bbe62363ef60d3d9dd7674ff2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80556bc52505e7762d654f915b3b3a80c7a6aea14f66ef47b509ff4af8bc9a8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a15b2b43401f56f1d1c83f3a3ec047e81e955f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85dd3cff0a2becc1079c43d6e5a86ca8f2bb2855082d43e07aef53c49fa5274 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ab94ed31adbd85df9c653e8badffde833a7ef1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9511935cc90334f54fad4c6b457cf694fb88ebaedf32a57f3dac166a0597bb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cb5a35917008b5443b73b4bf91a71318bd99cb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f41c9b0bbc66616dd8811373673b65d1deac2cc72e8c08d43337383e399b9e37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24a80f11c21416565415281bf23d9c890f806e7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df151c79b14145138d06d6c056c7e00e951d474c792d9d16b53f021647a08d56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e324cf5944d6005a05392011dcc27e9a4cbe565f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0061dcd723e85fdb66a813a12855f64b44ae93e814496d7471427e71de3151 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c592c45ca35c2211c5a36d0b135dbbac61e8aef6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c88d18486eca7c7a96be033484f2473c275286754aeb9d765949a64217cb612 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6021e2601d529c429ae7fa0e63d548584052ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac2dd8ddacd9801f8d38845aed4250643024227c72a7c8da5fa32116aca378b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..223260c0ff4f926fd039fef2922b6be0533f22aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0e16bc25bc5b126ba6d4352c7c86089f9be4716dce74ae3a20405fad2e55491 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e71b63bd365e87687b7a240ee246349bff08ab6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8fe6b9137c93a72abe352bedb5acbfd3c28f80cfca1b5684c8c4e1dd366bd08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0658c1e8a34d33593eea66bd00540c04af2d741a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa518080f630f53fc061358acd065d627c8f571254273ac4119d5c75794e3322 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bcef817da80c3ad382aabd7f622f3b971851f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dff03ad66f64d413033d4e522a9b78e196784122ce6268f5d74f3614482c358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebfbd7eb4eb106f9219268b659ff8c3ff60ae26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:787727625b13335b275948aabda2eb6650a99d4fbb21b18eeab5b4cdb7cf2dd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdd493ef1bb77958d3c3dc4734f3a10dff4bcff7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff39ae12818a49eaf743df0a387f1f71d127709bd18773055e3d56b071df974 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1cfadff93a80ff3153c9971f22057a106d6253b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528010097daa9344777490a949d468007e4bd552004d020d1f5c92f2d1e517d4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5514ae359428b192d3c8825bd36c3094fb651a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888be3b50f17377fb3164e06158d561709d8b32c9fd407b403585342aa7ddd43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4de92cb611b34e163aea23506719bc7c30cd110e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0df9bd37541bfa0868eb6314e093ef2952f8a46066757b599a7e91a58606f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb7869f9d88fc753eb150d974a367fcb9fb89f43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17254ffe2990ffda4f8dcc687b69bc8b1a1887f823cda7c72a0e34833050284c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c069c3102476da2f5f8194e6ea814e29258933 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153790cfce1a85115b09920d3f78afb0c8038d023fd905aff26bb23b007960ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b844183ca8ac2c4e356fd649db2ae206665e490 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f907df91c381e88a3a427987729705fa4fb5e5897fbe08b3f8e46c6214fcf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f3286fdcb11d114129530f044f9423c1c7524a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e2a1e2598efa02e0c070f632f9a05c32b7d96e74943cf017c4dbfefc0a3b6d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8613057ea8b00ade04a90cfbae7c5e21594d303 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb2c3a336cdce964e74d0b4e26c6912ad16efed93be088a4251ff38386ec429 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..624c34e4cacb5d042fa11729385cfc0e459f837b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e422524cc8ac731e9dec75b0d306c759992dfff77d4ab54ec4b08bc88160c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7fa673e28f01cc134a9dd0a4b93003e56679af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d8ad2133aaac691f6edbc70dda706aec57e3538b487436924099c22514d68e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07d2f66fb2dad637f6b2c206cad75761b8225a90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb84926b7aa9a35d7dca01c57320e8315705966df0a08662b23d1552e46c65bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..560e6175458662daf5f770c78648db06d9f13488 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1fb41288d0cf22da2e6dbb92e98fad7371e1859430fe81a8ce477d535a5e372 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4999361dbbe282dbfe4c2191cf0d3909ba35a780 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec2d88acd02807418e7a873eb2d8978fcf9e62f96c9e4cc475a392879da462b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba4c587dd6d0bfa475ba16a65fd1b3d25e3bf29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cf9b2a53bbe44194712740b8f5a7eb6fef9e09185fceaf84ff35137c6254041 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7e7c2f43b74cc3dbc8673e97355fdfc3b6e7b9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c983b61a818a46c3ed00de38a80ece51bd2fbe47b1f6c9bc066c1896e8144df1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..906981eb0110b5fab185738e7e06ad274e082042 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ddcc6b9b269a87a02bc9a52e325bab3a2ad568961bfcb7d4c24dbe19369500 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..536a0674564712dbc7eba62c943b2b33365e0583 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68223783f67dec5d2336d0e925773221b8c8ddf9dec93c21e2d95f4d392caf35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..646678231874321802157cac3d73641f81e518cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d68c58409956a310df342c624dd161b8bd4fa1e7b409600f4c44a3783ba31b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21bacb5652c5b27eaf098da8682e05ae5e9bcbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eab56cae4df4c7ff04b601c859e809b6de643d960a6f7bb55ea6a6c1a561822 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce4904489e95caaccd4b2a975e3bd260ed372fa5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cabe83dfeadb29897f0743f677e1844991bcf77dee7ac5f04ade7146f655da3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b70e5b8365837caa682055868473bb1580e8c76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7e51ecaa4d0b8845e3a9307c98af79c1c366cfeacb979810012f35f9d43fca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7aa4065885b12b675ec72a2077e7c5efcf3393f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7cf1611ce0f284e1bc3a7da3f828fa6398b9677e06a2ead7269da361a68eda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5b2904e0c2c87e891c51ffd5f595ae4aa80c8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44afe7b027e445a3c0f25de29070af874ddf39d1aa264ca299e3affd862e681e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c38aa600086fd0eb22ec1c3d08d44c07a984c2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e5879a8093ee3384634e2a9c86f48b3667a5e4b009c1673cb7b26847676bf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..732917fc504e6204a76a9b3d47edf169ee5a2c40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae96a0cf18725b91a2f1d6d3e34d24856f8f3f564ebbf3cb2552859e5804b73 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf7be31f0da589636a4c032b21992476fefd4a23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5adbf01214fe1e0f6ca90533de71c2e00f15fe0120d5f7aad094ed920075d69a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..516e738ec20768461bf2fcf2001c5a45a10e49ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a95e063b3c4b6db45181938389bd1250e2fef8cec926e77722433e3a5bb769d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2048f1ac9f845c308b07405a910c9e215fb2152 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87dd42c65b7486d1a0d7709daa4fdce125376db3f1fc6360679efea9218d9056 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ded645fdca7213fd217c4893dd68afce43f7f31f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db0b63d4cf083abae03045019463694b202e57f98440f597a15446b69c30fab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96ef65669829e11b71526fb96dfbd47c608805e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2531db958824a324ec5b0a9a9c8fcfba4f2c41d75fb347e1434b202c4196be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd73fef5303564a426d50fbc993aa0fcc2aa8f25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6769c50b57197a1b9cdd8af56e1d126863e6b0c9308deb17754196687e298e6e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d88a6ed863ad978108c5b588e653d22e628ae8f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2cc82431cea27531b908b5382c7b58c980061cb96273ef2a6408a08158590c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c98ce1b0bd1089f13d00c5b1ce9f9749684f3151 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860e4380571f91e3cf45bacb9ac21973e0da7084748fa57dae26f89521caef3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65eff5b392a1b6ed22c59a3efa9e72a22fb509c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd6d8e3c2521a4640c0500a12c844259565a0d22bf17cb6ccfb05372ce39ad9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49343fcbc0011c013a7bf97d76caa65032b372f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9733f9c71307b7f7b504c7b8c241a5ce2d52318be689957d4c95f3b84df5032 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..125639022311cf22c2388abb5ec3bd2e92829061 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f66d846031ed082813f9d1db4c03572981a36d80d5882879eadfd5120791cce5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f931c930f2642b2edafc8c4e5ca246d2465089d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559a35fc775cea1bf3d6b70510a1830ad24faadf75116d25227e48c3a7e8ad0c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f073f072101ea94a9f9da9c524c52141822cecc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5db1ecc345289b209b4a8f98eaeeb3ecdff5dd15a9ae8fee9b3679f26aad22b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9315acb670fbb1ace445e31959145d550aec50d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073b9490f955bb3722b69978f6f3f81349b41c7247c15ea1bfcb73dd1c36027d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ef0f335a7fdb9e2313cf08e834798d422b9e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac44adaecb8a93a21b116d16cc7ee43666f54a33adf057cc27e70329593efe6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc8c29681f89a49be0b78f38c82a308f846051c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f177961e5872c07209b295b2ea6b32d35305e1f5849c3fc77e5e32e45e291c17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a38fd95c526ee1200747ecccf9afeb9f18a4b86f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec46f07ecc385a84c5cc0b1f80e97d4ebe45bf1821e80cb39d1f085841ae452f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa1c966ab627bf8079a7795a3a0c254602328f75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa08b5f27b7c1edb7342c400eef6319e731d39359136bf1b4ce4ac6d7014ece1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4995fe5facfe329ee0ad18c9e6238ab422f1b5dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49fc3c4df5685a73fb0836fa6534626e39946dd6557c4043230ec1ab7c75bce9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d122ebdd06f5c524331154af8dcc5289134524 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e107f4d22c9d38e2acddb99f1bd777432727ffc18f475da984f190650c54721 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb3cbef64e2a33bc80d2c53b0db97294928ec07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6ceab48376819b735165f03a875033428399a70e0eced086d42176db3f0910 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..839f1ffb698288e702ceafc327aa699a5d327700 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304de5051780e9fe4dd1c258396f0ea8f83631328a9abc35a797da4b08d59384 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10722b4f0302ad3a97b51dc0caf178eb3ecafdbe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7c704469ecb74a63cef9756e6403e123c048ab4e93deca5797f801f6de6c19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9992716c096e593ae8586dc3aa4bf7f0a80542b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d008039706573e3b535ac4b7422287c2782a5541bebca4ddb5c616483a7e19 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf12425126b047b6c8d2d3b040d89c4a5e4ad99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82554eb96619cb54c483e1239accee3288cec157ed7ee1e9f9b176fbb03de0f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6040ffc55ca17f2b5b3df49fd2365ab408597ac8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7578fa2eb472918f0dee205229b287a2ab7d48460fd99fabf2bbf708d32aaff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f43f1bde2ddb47bcd350d44790a9c9a019f832a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9fbb42bf2be97a78e7f9d33010edf599cddd339845e0320c4537b796c7c244 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa156c97690999ce496a10a7dc651d83a35b4ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3c5c45cf74dd5c2ba250b7e4303b27175e38ab47371e4d5ddc85c9ed11d19c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9726739388061d1ca6539680dde81dcf8a9db75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14cf2899bd970d768bd914f1721c263815fb2a243a091b40b13cd112cf3e277d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6efca170e73cbfe96e20dd7afcc480cc4386097 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bca6d4c52e48286ef81ba0f3abbba0b8251bed4a82d3b95632e9332e071cc6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c3ebc8f60633529378626bc03e4d467d458517 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607bc65ecd6223ad9fa2547aab37bf260bfdd412b1282affe28fc09eb350dcf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df566db13531df66d445f7867d9511c1bfb8401 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2509c28bfdaf7eab8bc2ff4fe70ea0548dd1668c031ce2df96e4f0cf986f86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61c5255bf53469000fde0eb7cd07fd1113f89784 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44c76152772bd99ebf6a26d599d853c16a2041c473936c6e982ff75633a3129 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0168e6f106b2241fc58e6bc5c5dcbcb1593ac01d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb261b4a50030bca5398b8308b6a219c4ffaa4e7810d7cc3c723a3070ccace9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e527c2c24a8f3ee83a3bf3f90bf95a52b156f83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3637a651a869efc8e3f99742c06065f5f8d3c5bc58f8c55cf3575424c74828d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d0bf752bd657b83b63aa9004d1c8a693be76c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b0fd85b1341a90057ac4766e383e09315b3349a464bceca1a0d112b450ccdd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..389fe9b2c3e3d996000a9386f44ccd8b69797a99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4814a78dc4bcc0ce163d5fca0e7e780978c42fd1555fb38ed38b5b7d0f5fc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa928a27044a455b52f4b94688026d0158c00190 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c42106821db2e3e704a88d297dd3af21cfe48b7106b7f32dc0df2a1bcb1e608 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88f9e3dbcc32a2620626eb1417d9ce98f80798df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42065ceb1dbeeb5f92e4fc05d74309b90f7f14c0e8cf9feeb51d307026d2e731 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f9a941861d187e931466eb5f322ed1b1470eb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d68d5f421cb2edb5a95b4001fd24e8a44b9914382173df7ddc60137c245d81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65e8a81d8abab2263f47ea099be1b65d212b72d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6cb1548962a474a73e02c91efd3e2692a6fc84ab87eeb47148cc099e7df3f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d103c735cb3e2ffe8df49351874823e42e60d1bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6daf4298f3bc3474952962d3d1869c5a829534c5059a9c28881c15e26170b15 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e86a6f2114089952e6d013d521f9c1a8cd20e63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6795b5f8d95a2f1288be344069c7bd36cc6a604a3ad7366999baccd7a963afe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2685f6245a7d1fdfc962437e476976ed62010fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9fa2be8540945da5ababc5a2700fab3d1c8dd9a933e1d87f8fc768cc774713 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d06cf4698f79380b88135be440ac53ed7dab36de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6b4cf8e2e6ed36e3d07e2b074ebe7c722132f7c68f66f8bb6d5583cadf7517 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f2fd8b220a94c1c6258ff87bd53372a4ae040c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88bc1e16ee80d8413f7e1f04037ce79c3c55bc820b67a2bfa335dedbab214534 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e16776d7a6c3f50dbbe62570a7a589b50031f1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84710fa2241e3f0947d91296b60aa8c6167233b4a895601490f7af6face87954 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96c29272e723390899d8cd969b77fd915aaf0ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9526c9ed5c8412dcf291a59ddc206a518a2720445343b0b1648aabf227ba1147 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c034def35978546279a8e9688078deb556fc18b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1836b527f99c752fe1a21d5e82a43cd60e017cd16076dbf65086fb289359c286 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6145a3af7f3c7d17c18d432b33fb9461c2e46e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a1152b89f96f9b54b2ce81c8febf663f890258aa35714fda49b5cd3d64abfd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d23da7a2f6036a90a5cfc27e122eda2357844008 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3b95acc401bef7a66698e7f2f6923c6953c8b974312ffc3fd3b088f59c07fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e63e3ee30b1124cc92b4889c61002d6fd9779e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1766db22af6aaa33f4a328f6b0c2047b68954e7ef085214566953a556f5161 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..973e8027a3f4624807313c36d696d26ea50a6f85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4acee0ba18d9f8cd73fb592f0f6f12e2ae5ea9bb3b069c81fb4f77b8b5786c61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3552027fb8a9490be26742c9ca1817d4e02d71d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809105c4c8d462d245d638264a1b0cb7f90a42d1096bd194b1e31d7483ef2e13 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce89014d34d03df9cb05b864bfea7c124261f57b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65c51244203522d93a4c9b689eb76a456512c392195c06e05d8b6c38c117769a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35fd69857079e517a92479bab9dfcd50465cc75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fe9a502185e320fc068d67cd6c79628e9e7f8de16add8f5e73c09c73ab3b34 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3706d2d3789918af8297a73d817d1f9c3d9e3a53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5967e95cf8bc489c082a3a78c6e425715739618de48a59be153fbf4abd05ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5588ab7b920d3819fbabf89c60b04d357060dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398ac1037bb1e9ae6aa346c48b354680b94ea805e03efeaad6da6dd59a775bd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d186bcb8bfde2ac5c12a32f5762516e2cf9188b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea96d96994025cab65a675fea65d7c3f872d652288e9533926663752e7a4488 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eeee66f05dcdd1fe5b7e2fda380aaa3933e94c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50ae63a029b9263399264c1b6ea4db24dc0901ee335b3e152441bd6bd83e383 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c9912707cb6274041f1dfd0481b3a421d820ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769f3544f187cfbbe6ece0b0304761088ed0bc34a9188fcf56aef8ea80e56bb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaac1f16d26ca0bc6c384335d8f7acadbc556d41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5d71e96ffaca3c21e12956ab55ceac0bb7fc97d573f83b11f2ee5da733fe26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24597960926edd96cfdcd080eab7476b1e4ec102 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eefde7dc9d60ce250a754e49a5769275775273d7c6bb783de9203d2b6293c13f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a9b03976e22e64bfda2e4ed76d46addfac7c08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16149290ebd5d325428d6f9a691a32e3a6336bc167882f82bfad9ea2c5ae021 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e69615ad48ece3f590452347ae4de8897bd07c99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955a204b31fc997859e55787eeafe0b7a70c2d7b82ec689e1b1bdcf1bcc5edc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3a9da668e03e2365307dc9c659e2d091f45e99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3ce74e2e4c33a6777b85dca6f71aea288cb2205112392364522f5f5cd7bfb6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..584135478e5e91926f3b9251a32446086262b14a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c046e7272095b092401d601b73376246c6612a26680ba81922b4bbb3369df7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c1d4b23b1e99302558e4667ae2de1ac060d458 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7130c101b2bed0049e2e123bd4521659aaf1c1d2d4efb9041190a9440a9280a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f0b97c4d519f94f97507a3261456acfc524f961 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdbf8b422bb481e30b62dc9d4283e3132d4601d6ce8be90d1e5c24047da7a281 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e23ee1c3cfb28b479ae11dd2d0be68b909910a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc593a32eb58cc32f77412cc35932538567b04b2401d177126e048be9b225bf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d922b4097978e9eed4e488fcb15e5f9d41b62b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38c07ab3cbcef67c4692fe7bc7a2bc0c01c9371b6d5469acb21c07340ac4916 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d867b152a0cf46af3228c08fa8191a1482b82d60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d4f35a834f051fc03d8c63b0a3f3e31ec08878e68ffca14b8f4fb492c7e74f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f40e910bc375a61b3820c47a196190336f7f003 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0edd006ad55be47dfe08fa155ce94fe13a0817208ed0f04eda5869653336f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf205ad0d3db65643c837bc0745cb09485c10361 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6d5fe0ba0da8a036af0259f7f8ff14a81f08422d230f938abc3d55e298006a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..498ab8ee0c29b073ea85a29d2ca90871f0dff1a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164a3437dcd25bc13a993782fd4480c9b158023352fff63e544c4ea6ae04a9c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5640bb53ed08262c5526dc532fcaa119f6bd3b7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da87d9813bc86e11782598c20113443cbc46eae4c55dacb8a046945027a8f466 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..203114d396f8067636109f96322e98a596694d4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8462a29759c98246a66df99bba8bc76d419702f694bacac3f0b8eae3ff6c4d85 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21a1e91cb9535d56c956453a929332754d98b20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2012783b6e8f4f30d8afd1ca829c4ea865998b84126ae9080f2afaa915f9c6fc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95010b859d8c4e0efb6a79374c46987b7b35eb4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d95dc091c771175c63c31219f801c02fa5f3e04f68fff3639fa6ccdca6990c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53d5315a3384b95b1eddb55e7f3043ca772c6cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af511cc23aceee453d42194ea1bb369574dad833040b488e4ee229962f507bf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..128a41685dbc5d7a00a22ec031448b87a4547613 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330517838937829c43312a8492cb1f1c5a442b098d22b3a1de32b60fa3f45e77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f107a5a66afdf4dc792e5b361d8f4cbf0cb801 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4aafa7a00859a16862163ac9b56b52d9772640faead6bc9a20f3717c6710433 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfad937436b3f41d153bbf59258b1077603765b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb97debaa8c7f35a24fa360691b4134abcce027f48fe08be76c89700ea531cc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0367bbf84f7cb6bc0c3bce7cc9fcc9b8f78b0909 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a25a911e54c05d1a1e80edf3d28724dcfe7751a2d4da3bc5ed4b6beba12cd7d1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce54c647c1c8920fd592e7e8a275fe0f0b20092b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd961fabc2587118cc290644593ef12905fe29d38e8050f70c7a8772e4d1458e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56d3d5b8b708db3b642052c71c86b30b6c757874 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1053fd99ef80d329fca3f1fdcd1d998d9d78cb54265ee1e68fa5f130510083 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9fc8d0ef819fe47659d059630367dbdbc67ed87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9339b40c2eff87a883979c96db778166276fb7055015c5a5a027ca00720b0d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..609c05eaf13af36768bf11bc56f01d20abb58e3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b10b451f40d1c537918429ab514fd660e15731f2e242cded4e72af443b78dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c59fa7b1231b7d086b2cc0d998d5f93c832102 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8499643f874653a3e568360cb6927656b6492c208a11b84ad0d02e219bd62cd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad04de13526a9a083fd9467e15e5358d5d3bcf14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82fdd9a82767018811f5e88cc0cb6b95d49791bd702939ddfc508c47d6e17078 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b36fe0386d7b106816de1bc1a33309fc105b3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a7f7598a60fd014a6fec1cbd461824a7b936183dedc0137cd6ceeb9d4a4b00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2ffc118eae862d873b39743e4163f986a5f264 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d1d8b93501219b23ded254a3f9c9f5a07d2f3f37800085757a9ed5c01905ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29857f2f58f482c7db14c627a5cd423cdf486b53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38c5164fe27ce699d84d3b80d9997a0b8f25c547b3c55f4e53ef8a374e18cf28 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee853d93c7aaba4f2dcd6d270665a616c5c41e83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec262f9c8965fa8cf8988cf98df458b189dddfb9599d71e1037ead89e984403 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78269b57acec759eb2f022a54544998c3b6f171b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb39c589a55c41ddebda8227de9b4c8e9f0f8069ccc293ac5d8463af0bcb5d27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7229c9fff6c290f6a04469e9d4a4e4109161526 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc874da1e9fcffadcbe7972ea021b3e93828c42a8917b44825d3dc6afefabb55 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401451d57d6a58cbf27aa397c156964588f3a998 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb5bdb8cd090cb280ac197627c5695f6d9261fd7671d76bf8fd18bda47e9ef25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a6ec94e5c55f4bd6147778cee798be20a4b5a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad2799c41396a32113e2ee6c618aaf2ace6cf64f388e9a53f11451f61c8b050 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..264735bfbe6fe73693e2746b158a24857fa3dc53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7807c45d1a2fe21c4735b113f5cc46932143eea7b95cd486847e041a1f2d191c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0095efac65b8ee7353d24a5b3d770ed26317b746 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47156962ae21248b7d845cccf6f96a21cee6024e57d33c95eb47c87354697e7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f88a07720977eb3f4133e1b1e5892d312ce2c1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e21dfc53802cb3043b5620cae7fd53a1fe0a889f48d12ad877f0d24dcd6050a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76afcd62d3162440b3681f4d8cc943d0dd87cf0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547411b38bb15c9d1560bef75c84768c2fbe5bc93ffc6c4a7fb888fca7763a4a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..831fd82aee76a3fd328469286affcd0a9ce518c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ee669cac70eb8ca6a7fc0992f42f233442826b5372f13a961a00f6cb5eeb4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b0f5743311e359c0eab1283af3d603cf306d0f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32d848d4a262480d0c58e033f888f80333266d1f775d621b4040f4aee35690c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ef7de3b89e02ed7f652854b4e3945bbd49631c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eed2c62b4440b50740782805ce0005a75bff15e883cc2bdb59911abd5d872b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..936f0e38e1846746d992a7040b2d1211f00be3b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86f70ac97776ae089cd3606c3739479ef106e941ddaf604aa530ce9372a3110 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94263051f917cae1ea4a8fa886935f6f0fe34649 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:202e8d42a22e140a382fde5b73019d7300171c14373e7b1667acf76e3e285e86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b0b8120dd727b3c634b7cb0b9f2dfb2a3be2cba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af57528f670d2357b05aadaf5a07da5cc98a3b8726021cd97ca8b5b628e20338 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce0e494d49aa550b70bfcd6e4e6685d84ccf741f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa45ed8eb990d63965eb60e9f4ed279451381607ac42e5ee9043b4513d66281 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8cb026ba2d6c804efc0db3d0b57b967df61303 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc34d98cc250213cb0464af52e1bdc218b40606f30dd8089ef9cce2c23ca9051 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7739c5b3ae2cd038e6c112f5670e6d2d2e3dfa3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38885c6c4b477295bf6b212aad77e03c430a4246091a187a3dc24d624b47bb32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18edbea51105530c284c9f6899a099b2ec78c0ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f938bc8a15307f7afe9152cfc6bca897c565890ea3f47da7c39b2f45573c60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e0b65eb081181230f07f703b8a6a038a77a950 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f22264e72dcef51a627c306d03cf6fdac5927fa324b9e6e013ed0b81c5bd3bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d7bdad50127df8b5ca024aa91b82fe2d63b08ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e7dfe7c2100c0c56615621ab536014d78d43258309f5b955b5c6d981754cad +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee88c7d1a6201f3a84002ac25c4941132f8b2412 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1917e5262de8f06236dac5062e5a08bd11c140a42b59eee2504f1e71ee2caf75 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0105c3ffe1d1fbefe9c213147de90430fd4f0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754499be8638b2efeb05cfb94900ea85caef19ea3def84f18a4d286bf8f2c97c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71ab0242cfcf5c078ebf2beec7a552776a2ab84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c2c213ac1cbe226597cc69173343455bcea3080cd3cc91bd84815fc532046d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b367d8d132e2f82c606393315459d57c9602220 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d478fe2894e43a3c3472d655e71787b39550dcad4137ce9bee1cb03e810bfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac22e7c2b2ccabe716f0c8561a5dd2e7d51718a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b22968ca8777f355d33a20146d9032201facad7068fb4d4476d752b958294a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b249200f65496b74a755eccd3d74c0cdb17744a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea77aac085ec61851397642284864375a9a005662c21edcfd64dbc42059bb24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7dbe2f4f1d9ab7f6d8d67e2ada40e8e1d5f7cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9fba73d83af46f80d381d917103368940e35da2b662365193340f0dc5d6fd8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..421bbab6d946ddfe1385b147e2b5b7d932696da6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ea8e3e4f56f7bfcec5c15e6ac7cbd72c5b222e2b14c06a805c13a11b8422e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a90b202787478e9eda7feb7048785e3398fc14c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd9fd0b53d42ef3777cd93e9939a9308bcf648396705c360fb1672f77e7dfcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6307d1d9813c6681f7079ea7d9280eccda459e55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e835b3b7eceb5220e6b185c45ddbc6acc75c8ecc9dc4c08246936f6135ffaf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc21b0f59cfeb6b0eef93f00013f87993e226d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd369859ad626e34b73de59884063d5ad37e5d15da10d058c0ee1ec84641647 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66fd82584da9276bb8f80635887784969ba5f9d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470d82ba8c6aaacae904965adf186022423173f14f42a99f65c5565530821eb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..804f2d0376f885bf7b2c19df2d34cb8ec64eb0cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b29b06553648269881d7742530fb761b22372bce5b5e25ecdd4dc07195602d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10a9fb232da74e0cde0642aa24706e71386a0e48 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9485b959ce03edbfcb1e599ea49d865a7f75b68bd3002056972126264a3fd92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55d1d87c439ae3d67d3c3cf645c0e9a36c3ad9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b0d5ba0919f022037bf89d2e53a301e7ab5e5cf192b99b8a62a1490e3e7335 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcb5d4ea785346ad6f0b04c291523f9ef178a4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d37fa27af73551f20a192ba7c98ab3cca3a3dc7f8b23706caa427df53fb21b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d98491cabfe0e83f1230dff337658d08138a698 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d54c8b3da5e2d9f1b7c4a1f2a8072a119335b2475ab2ad0602312bee34502252 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7a46b2856ef2cd2d9263c1049b6a601596704c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11680b6b6a618c6f1b62483a529c6dc419b5f61b6e6b0902b2a2c58713c1d405 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f500c5848e9a9180a8eb5fd0955e443b127bab68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a49d3fb1d5617634513a575bddd676361f680b8b2e6bd66071f511506b803f9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b7bbfd46c0707f703d95e47ec229ca46c1c330 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904eb8adff5b215c3e506174796b0d92bf732de61a9a8981ecee2abfe6532f26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0f1c1cddcdd4041b5c9d003d804a3ee5548b3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7640df859a8e843a7cb3fb8a4e74167f720db82de9f84549b17a8fa0b1c6b5ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d985eefe76bcc735c220e6c1965a2615d305ba49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2731c370c17b0c1537587691e782df27eab4ee51586f64b3fdcd210a808ffe0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..211cc9135d1b6b8fc2530af2e38e0337d7812f13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c831bbabe3853de5383048ed3bd3bcece3c38b0f95cd6940754cee5a99a42de6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c54002b7834185b68fa09aadc46bb6988200f73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd1a543ae45bb4ad0601555e8f04b052bd00dda80854f03a23e5f1b9fc8ef35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..849878adafd42dc2b3ff10ead84b43c462cccc32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d552c7d8566e5e5247147d19f7206ccb4555345b078280c61613447262a2b289 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c189570f293854842eac938efae5f96ac6634fa7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8162bf32e0a03dcbae916d0346a93de42df22b804d006ab914e8507aa528f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de86bb22d71a6c6fcdace4ca0737c4b39baeea29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c31898a20c0f37f046d31e30d46f06cdbbe3a85c8e8ca3d886f5e1d8c0a346ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a26fce6a20229320bef8603b9ca73807ec704b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae9bcb08529ff43e2ab17e7d7f1406ea087857a142aed964b6e2ccf27c98ea7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..084dfa5173ea3af6baedc79fe56fb13094665985 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be4d6fe13ab4227a77efc2b075d59aba4219de083b79f42e0ad9ed581aff7ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa89ea48475c5ace03864dcb9e71ae8090525934 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac85ff48adb60f472e9fd0acecd2cce316307fb9665bae95b8650bcfe4dd4e50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e56ba5d9cb787e1deb7df8b98cb417f5478e1527 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3e1df44cf7a59c7ac7eb2cd5632a393398e0495e51747e5479348cdf4b362d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb22176fe2b7bc15f0bc36acc88ea42bddfe6e9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9b2c1fdb57671e9520989aba4655d53b5715c369f7eba31714bdd67b28bc0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4a8ed1260c1b578225fefff06a17c4ceb420f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d703f5f8c6c951a03dace872f2e41e954fe1f424f6840e579295c7eb5c28982 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..097a7f117725443475e856cc80bac813df66aada --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6648b1a393df34a9bffc80cd66f7b35a5c40e80934a347435d4c19faf224749d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b96b85e10ed389edf144600c127b623235e67778 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ca1aef0a14c5e3c986a04b6c4f80111e9241b4c1be027eb7ced33a397d7495 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f4603c22d8e305b2c863ce27f35970898b095b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc493341114e1798786ef10a5f34cc0c84b4f21a5c7bb6da1e2c0ece257f3520 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..714e7a41418e98cedce44f928fc63c0e003ca448 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464635959e9c515e58c783e54bb90186a82f92e1048ba26df4662b9a7667f5eb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4d71d2a1a81079d9115c8ae1cd50e625052cc2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b76c2da780ae9d06361dc3aadc38ca34db14dc60cde5bcaaf3dd487230c4dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a1b9d81c5035c461ee8c83e2243656b3c1bac1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79df8912e92e9dd1a0327db2b6674139cb3ddd42ef8110effa54dfd4c7f2876a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..464ad86070ef9f4e5a4cdf2eb345d4ed38cfa9fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d70b462900c4e65f38533b7c6cfd2b3b68323ba4669fe96dbaea7c8bb50966f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b92d5c5374a2e0b62da7f020a8368151341b3bd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba02ca2515e532ac87d2808b0497d5e7cce4a091c902e939fa736e7dcb54b95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad57850d26b9f9f4cf478cdfb187274addaf6d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e173ac53e112d1aa2e40cb5f87e671062fb4fcee5e11968ca514847bd18288c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..964c2e53397588eef1af5b965bc153b6fd81ad67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866f9c6c04853b51ff9cc059ce9aeef54fc2b9b7b8f0895c96a058bcf32e13d0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7fe5b1e66a146523156a4084c11b1290ebb38ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c83938139331dfd226cf7ad73e285586f2d168dc38b6162cbce4b857487c4d6d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0990ae20b3d40f07b8888399746d9b28fa794947 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b837fed149a87b299d4738aa71aa39dfd4041a4041d516b16c10953cfb796bf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c178246871e25dc3730877922aceb78761df2cca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dafcefbba94ad20a11d4b15b007d5a0d7e1a79166d234f2d046167314bb4c048 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9ff891cc27cafb0b8c2b49e139b1c8c734c2ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99420a58d77bc10ce0128e879bcb88d3dcd6b4747216de7a086dc6002e4d77c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3bdb8f69c8a76fa98115ea06f40bc6218a07f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9141dcb94756c15987ee10096db314f10c52abb493cce5956a1af16c7f7562b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff9f9aaea386e10300f2c72ec3ba6b96b11353d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37544933e47895a4dbc4717fc5e4e417f66fba2027aa04e23cc5a24236dc8d27 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5c271b59358031caf637d22ace2a91616ddb79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d709e44428ce58fb5ef92a8093b704d7d08bba1e05baaa49e3a984e887eff30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35634b9f4a8e44a14f94727af1a974b3d029ff75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39351836a4d07f53bc486e8088d02b2154b6248b27dc3b0ae6e2015de01fcde5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67c9aee79fd92a890709a9d02767e1f8f80126d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b334016bb1dd1ac39d06d12fea775dfb0b5e58edf214c28d56d8c5d94bfb09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..599d1e406221b6c62e78d926ac9a3ddf88be34e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28502b681cb037a99bb5c3f63025893b1cbb98131404f70d4446d7be796a231d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de3be69176ff769e873ce87e5f1610f24250b3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0aedd4e3c0f12dfcf2567a8abd16bd8749bd99cbbcde630aa9b9bec8093cdf6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ced01d3457b9e77ba03689b191e3e6f0c25830 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07df8764cb28eaf7ff89bf20d1871b48c0ba643fa963a7a6d0de5fd87f22a3df +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..047faa468805d05c02b50f725a42658cbe110ed3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38b93912f661acf588af9177be88fe2229e85a134070ee9535fdeefd2b350e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db957ad9e9c62637aab8330feae1931ab6768fce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4274615c90e47d3be1f9036863d02ff2152a8107da9cf02bb6ed21bf5edb0fb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9315d9019c40c24083c0aa59e29b46c9dcd1ba9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0643a15c3c28ce497a49ada338e9d00dc06e404aa28dda73989d53b6489fd094 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7dc871af054f9c7477211036557eebc1d300b28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915a377705a90b233a0cb711518f60671cba46e75f6eed69f4a8bac70625c74c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..632afafe2813d82a09c1aa22868f4b3d894eac44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0999bd24921418c45bd934a0a592de716a485aa5bc6c36d34e584a0119023a7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba42f89dea4527318d6074788c693b7915da2839 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73bed80928046df0c387ace77b6c9f4abff503442dd8945b74417821399ead2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..901fed69647570a4d09e8c5b25cdaf3748091d89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892455fdc40c472179529c22e5be83867a44cb1cad592b9fb21f9c567ab8fcbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbe376c55be1b1c8596dd960c196cdafdbe4aeac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225b28ee2ac5f1ab08ab0e70a96b44d1bcb7ecc705a2499e89a27ea9e20da509 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d76002136cf14bc21079da1cc1e6aa40b071045c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224a59305936ffec57187cbf2f31cefb66f59d2f6b8460e4353333025cc1f6f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bacef0479ad9b732614705c27837266bba9cbede --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7596f161165cc16a4e390d67ad1be312dfaf2574831cb83bde8b0ab57034a65d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ed9faf0b9f1b4e0e50a9c1f138b49189e84fba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2601a36902600a9d6fa41ea5921b00970107305f004091c0d694433ccd2e00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd77515fcd11e501a32f039562cab1ed3a3dadb1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e127df1e74f7d098d3b5bfc7f08bf0d6e0a7555d0ac7ebda34f6bb0e2371a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5582875e3e86217eed6489bb6e3dfabf27a6d94e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c667477639e7b519e254395cbeccfcbb4022169cd3adb4a361ec88e498c190d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b1cba08ec63d0daa25b130fe81b59cfd998a82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb863ba212c40d980863cf94ba650600badd013afe315be5eef2af12db659bba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c39ad7ef71eb80a803f24dd760077151bf7bb62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a021347fd60cb0563a4017b1aacc2329aa588d95089b74b48aea677fe68f77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52bb4132c9779ada0ae6d705e1b167cb7adab25d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9541fcf36df544a66251144b6b3eb0f8245e219df2adf0799b485a128850d9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01ef71f7c742a032b287254fdc89fcee625c271 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f59881bd055711db1b055056f025da0f5add01cb30908cd34d926979ed8408 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58f2abc5eae465e89524cf64197d0d2b4e4cefff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d735d33962243b2d7a892ca5f097bdbf32505a60ec609419815b7e4c731644d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4b8df5b6b6a03b6587121e3a4e160419895ed6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc173fdd348a28a7a6afe412b535f6044115ef6cbabed8c151a5763c26f00b95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2fb51258ff0a4022737c358a43e068a874e935 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b113e01b710acca478152701cb06d786490b86e7cd590a5d26f787615e41961 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc0903e57e68209db8d6361a94ac265838251c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5326fcde7666532e4efc2ee6673504916a83253a778fe3ab7cef0b169310bf38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ec2b2f96000e14b8b76a83ef4b7de943304b8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ea4e75ff12e0dc05c151d113d30092a1db09a8f8577910abca73b722f94bf9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f3db9280ae27c6723cf166f90ef99cd540e2c36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30e44b2d80594d3040e5fadd0bdc15f6efa05d5d528d34932da0cb0cd567ff93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f3e2a55a3bc796518b9c6814d27948d20a46e28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e02bfcbb7c0166bf85fe8e325e1a58c0ce1f813362098b1993276876defecf7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d187e28d9b67b247d3b4b6466eaf371d8233429 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c23d21de95ce593561c23ad81c6c798242ef40d1beb54421b408e88581f5bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38deba25ebd58f6e55ec30a78cfe3b3ee6a3c9e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c17648b1a7e14ddcbcda5d17bf70fb48705d7263cc87d023bed302aa5c3ba91 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1c9c1f15e76530a3c516de31d66eb9f5b71e44f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c4db8abcf2610c934284b08aa5bd490fefc1979ece135b9038c411066a1a10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47d871c3f2ed3e4efc38c2d6dba7b5e6d1904932 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f8f231ca2eda95e340ab30f26f0a6ee15ce5fc4493b8b2ec323f960b7a1c6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0627ef6a1de78850fba273784e0e32403caf5fdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d81ec74e2f4df44275664e99a761f09c42adc9422e4f5f0fec26ff2b48ab3c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..267c6e63dae3e7497dc791fe10d07b8aaf752137 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3ae5ae7a0c852377eb983c222ba93642b945ab920f3cb1d783a39ec2c52ff2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bbc9532ac72166941b41cafdc440f80b0931da7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f99b5529126cd9bacc004d51cdc5b8f94870a172221c8b85223365d55ae995 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5bb7b670f1736de77c475c50aa324ace98206b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52c0df48a334d51587d5f06c8bb690460fdf3a8a2917d055f93597b55e8c5c50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb7df1a65d78c508d5fda4bc721ec40c1d679dc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a250f2c923c97dbc9867783551b81bbc5e0342cefff89bd8b286456a9b80c2f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c85f3f20c505b855cd7b5aeb822be865bb8b55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fdba248ea2dee84e1b7a5945d2013d24fdd8ba73250c8dca49feaae3cc36e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed9446019ba51339e6fc0e28e5340c857cefc16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0712abaaece279dc18d7b2a76914fb935437d5aec6618a71ec0d326935a4d49d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bd957a2179c3d69baf0807cc595502de9d50486 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f066526372f0f72f9d22b124b05eae8f1b693c8f0b3e205848788d729744f7a6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad04f7806b30a0770303390610dea7ab923d62e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f5767e33ff9effc058c1dc4f4f81a24ada8e0a9bb3840130722bd978fab170 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a153bb35585c7cb3ea60a5c1ca77bda21f16dc89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c9f28a4b7268fc7643a1c4d916bc9b9aab685d5f49a8484d8ac7a5512644bc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15784f31981def96b68724f3536371d81557c7f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0a0cd7e3ede3fefda2f04dd013c8855c0f0ab0896ac3d92b5108004a917707 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae2722d34734168b53d3934a2957eb7045cf190e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9e7814b695b821abc64618f8019ac82ea19ef126a210f1a83921692c386bec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72343fda3ed14d14d300447f7125941bf681a352 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faef59df410b6136ff8b0588e2ee444af60f75802ba485a112f8cc71dc5de870 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e99c606692b96d6f7e477f710806b63fd0aef2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd37de30ca11aa7fdd73ba72f25e8b9996d919c77feddf44c3708896f2efcc85 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1372fa8a51e80182650e08581727e5cf92fba900 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caccd38f3b0dab09b92a1e51083719bdffa5b4165b26f826de6dcb958beaddbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05930669baa13a5426a8a5a7f00067486c03f9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0707780272c4744cebb070c7efbdec4a7eea487bc13480bfc6829a4239bd317d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db332654f3ecefca69a6ef0ac3f22115aae5ce15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a832b1dcfe44ef4f396a5a8b642fa2d21c8a25a43a414f3216f453573fa6c933 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd14890a25fabae2054ff4e9698349d0638e7c75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b3ee7797b98ddcbf9ee548270be06d31477d6b7160558fe34ef2f36ac20849 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..670c8e6143ec9fd70e3ec9f462ba038ac6348cd9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0edf32b52218982bb8e5b60226002ff6a718b145d064f971b9dd026527cfe4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7b223bb12d4e4486f2ec8ee89c090dee55d239 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40eb8cf362c388bf1f0d4a347551b3d261ee927a546b5d53596f2aac203893cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be91dcfe25f034c6914cd0071de8066d1b05ee50 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a555a2fcdc81d4c34e8c37c2d0bc92ddeb64017f0239c5b9c7f46f037e7285 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a11d58f264c62434b32a40d72a4c7c230e9a8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e428903ec10a079a3cff3d5e66fc05b44c7f402d192706f4a76827829b66e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8434eb0a4545c2b91fd2cf09f6b6605b21a867b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e1b2b0d12d4cf2b9ff9f00596854a6cb9ca538432840c214c336acb1876598 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e75ad6139eab3e8a0b027f92e708e0fa1fcbad4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ea8028c2f1d4e30614ff8ab09e9ca2593da0366f3ddf75ed6e02c3e982a48d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bac1be32559493696cd14919ad6fd4b0be87462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947e1374a43232cf8c16048dc77f46eedd4e26b86da5463671eabcf17ef75ac2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..121eb7604f4422f6aa952b5c1c2bf61ef3c0ca8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68446b3f4cd169cd04e05b8b04be3174669ac26398892b817b16e32ab360afc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a83311af0af708929f56b84ff172aba4233ace --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a44814b292cfbffc2218e1ac1b9dac7cb22e83453e73618a254f9a58ac04c01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a3d3df8dc5562c2ab480daa902ceb429572ad0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79b5c8d911b0750b8f965afd272480b4195422caabb5352eb87bcaaad3b3b55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e6ce8e16436cf9b52c4c7f6f78d6275a0a9c1b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d548a13a7c770e460376ee7cd89ca1f02ec22f4b147a818fdc071d653a50ed9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a373feed163a9d4f20c6edb9fd1545c5928f7d02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b898090f90bd3c19ae9ce4cbb518588a9e43a379aec52000874ee10a16d417ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19894521775dd5c62a3229747766c14b6562f7d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:066544b1ea87515ad95c9a9612d5692a1d2c081f3815efcabd4b2b1866619a28 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dde3edcac52c77981a3f4e82468bb0f20f00c03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5485eb19adc1f78d6cd50ff36ca8347beb3b7a95a516876e302f680c990da2e0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79be425c3ffbbe71f3593eb05e6604d376ece5a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604f7e21523157de3287934fa4481273ac98ad10581f9a1dd10fae3d7b1478d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0933bd5178a006783f1e3830e29f226c9781a323 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c870a8846e9d776ad13de90248533fb8f325234e9e1cfad43d30877f501320 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec44e387db981470a1aef4f565f03b0616d1f7be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d82f8d52b76044876efee4cd3541f7ba739993d02fe00d59895add27cafcc6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da810e254ebbae7db8d245e49089df4ce78cd7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e409d17c2731bf0dae9c9439472f1c3b6e467df3d1341c8c29b6fdf7e46717cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5278b6b1646410222ac9458f98b89a5cfe9170c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46fe8513a258385fafccb0e67a02939ec8c1d5defe5e735574da10e947f97e51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aa4cc867774fc3083ef57550e77816ae4903226 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab7dbafca52bf0b8926b8fc4d31e0a717fd2bfcbaeb579648c8696a794f703a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fa960414047deb66a56c14097980c1d694ac101 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:642e7ff2bb6b7d2dbba720d7349baa54f195e958c0154525c33976cd27fc5911 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9d14baa368c8b0fd2aee5552aced45f87cd7a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8975f33af99885e7f582bc1b2a8a69406b226b17e5d834241fdb7e77a7122a01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f802413e29d37ee44d6a791fc67f5c449ba269a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af40c04e1a10ac8f27a3761e4efdcacd1ff16fc90c1a01b8de837b30c601759e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40aa6c44a435340b0888cc0d66946de947f1d709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b895839f9b8b93ca4c641bac872071ca83804bfdfefcf101074f223c2e12c626 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc5a7f38797a3260bf149f9ee7352d2356d93b5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb66618d19a4bc5a3a7664b8f2fa0ff9a7c5e1c67c7f55e444b96f79192baacc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..437c6acdd001bb3e706546f4cde40bb1e0507e1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a93faea7a29258edc3ac6343828dbc25e7e5749a6b7aaa219a263eb1199db35 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc79be9f7de005e4feac642835eb7c7644ad7af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748a40d673adf99b52e6e833c369200698ff3f065cd502958d897031fc4bb9c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..666a2df4125bd6e2c095ca80a2773bbbed07bde6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fbc2e3b5ec624c525b7d230e820944c680eb8b4b168db083ad16c443d58faf6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a10c892407df01016fc2de33d6edf4a2b3eab76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa55e9030ccd78c8a789b1e552ba121a808fc6014ba57e0ae30b3acda0d8be17 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea1a2bb1ecdcdf54ce2c7f438c9619b99d6f4439 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e0c3c18a597eb0b29f30efdb0bfb0792f164541988439586bb1f3192f9efad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..372cb9b3599c30d83eb0da73e1f95ca0240e98a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a6cba4bb7d1a77363605d39a9022eaa2f2a781f8cc86764e41f19dd0860e59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d1dd15bf04372006f6340544a44da282feddee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3743ed62afd40b19fd485e5c6f20ad5d1682afb100fca99696e1ef49f4674b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ae3de9e5abb086a65928d1ced3cfa9cbe8dfa4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ba1ed4578a7a952a97aaec0b2d7cad548773e940e0cc4120274ba1cf7bd11a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4808290bf238bb777f649a40fb99ba39eac6a4c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8100c7141ded77d62ab7bc17b3d5baedb189c657fc98b54b7a52333c44c081 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3230b1118f0a8a23e3cf3ab9aac605260fd424ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be20506504fc5194b8e552b591c80818856cf50ab56d798a88a17b546a493292 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f11d506c3ce60b59b621270b2ec58eb298ab38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e755909c408adcd91c6be3a3252a7901e22240679f61401fbcec4d259671fbc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa1b3dc8dfb5d7709048da42211f565bc82a4ff6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5994838a222e03f031726c37beaf0b1d386fdff5d25fa59ad08bca6434e082b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04bc2184f118443d6a4fef55e36f78fd824cfe63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ea9ebfb97e539fc9af6b06bc49311c85f0046291d8ca206ce8152612ed5ec3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e743b01dcdb69454eef1f4b8f88ee9fc2e532d86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22277bf1543c9808944bcae9d5933770b68c61c50987835fe24bb90824f23df0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd5376a87a4662f1cc0d59639f3c885fa6ee32f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29b428be1060953aa7b45c65bc36387234de7491eb642f3d786697f3949e7ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f3a564200704aaa07751dee1b259b1045949593 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5f812562eec71e7d6783c3f26a515f21b8ab880a12cb3262bf6a3fd1597522 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..698308d9d22976787b1c8ef11302b667d7364875 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a8d0c9b6bc931960f19e7a4ede7cf233d6664bc094954af2616a3ae398a4e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6b6e2952c5b26808335967ffc7e29e2e1855d3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6052bddb64692d260ad2b53a7288da0295475197182c862268cc1bb94c46bbbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7629d5f3bac4616f050c798e45b0a7f7d20dbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7e199d00e0ece777f6f7d4eb5ad30cf39d7ebc17187a84a36da0d9e4eb6cfc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f7c1bccb0102b6ac2bd8f96c814a557437eea4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da34c9edcdb3ff21917eddc0ef1713f7a045a28c870788008b69725667fd68b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e069936257d5a22f6362b0251608fc1953df1076 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbdb7f8bac64eeeb53ab412868438bab26d9ddac5b69103574f79cf29d44f46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a2ea24dc5b9061d6e293533e77e14243004ddf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a40d5d7758d6dcb3bc2415834625b62bf960a560ffcbdd4aece3f355cb8fffb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..682918140863cff028437a57407130473d07fcaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084f493fc77255ff3f2c230762aecf7dd92c78aa439dbc697b265d230cf2c9a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92717ac1d86919ca8ca4b09e48eea4f0c5c99ee8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb29698592802e50f58fea1f464827dfd24caae966e0131889ba1f69c0a283a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6553edcc58783fe518d56e6df3e5124139e22796 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea34ed27bcf661f62da3748592d35b093e6ee76a382ef2a9a7827e79d019ab4f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec5c94cadba503a4239df3e5e100728caa8a354 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b625d951ed32a70452ae47d85ce989eed6ba1e8631bf6c3786f10abee5fdf4d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6cf8933eb56746f6d25cf1ac9fc94cf06c1aea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f7c181a5b8d46550ff4e813ec9f7bc703899f425e04c275514512117261b6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..732a93e29b3d9d961abff96b620082cf6ccb293a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f9fe59e8b5ca1f402e8383cdc8061634d98431b58b846ec17c12a29b13f775 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..573fa3a6b1e2f8226fadffa14a843209602099b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0161bedec366165f15908d8a0d37b0b1e9195832daffc37e27740830e60a99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46fc7a48f57f184376835ecc18502e745099eb29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed7d30467398169186370c81104fceeaa93a1c6c142e64b03d0a4025fce7a82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dd61a1489c64a1777e4df776cd5c4aad1a0033c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1168731f192e82ee0970a630a06feaa6737d0018ca1e2566c74676114c106b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceed0c0c7f59696150843b5194f496918a82c467 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a53c11bb6e6cf086f3b828daf65eb5850d521f390e9585c621580149ee594c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8803682b0ca31274fe24a3b5f6773e0a514a63c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c54a0768fac2aa959dff41c62d784f3eecf467a57813fe7e645d77f773e8f6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2ddd2cafd985fa65ab9f158483c048551af519 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2ea21823dd384751620fd5f8b05a13b6cbb11219738c471af77339bfbd01ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d81a67f89f9b1f7d4ab81d40427d80146ef4dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4a362e4f6505b848b02f86c537d5d4c562780b33e5186fecb98e8b12ddec6d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..971fa6f7abd0b7d2aa155d5f5ec14a19c2cf5779 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72e7ee1fbea513bf6bb90f91e284b4b04bd660fe337a40c040011146ab86d4b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f054c8cda1dfc04bd646b5ddc25b94a5024dc95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c80a0a163eaaf330d4b86e98f68711f5e440633b14105ef8d891b2308ae445 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f19efd3f05346f69a52ed3edab71226bb0313b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56cea8ddbb4c896c24a1d46d848adc9e213e84409c6a0448dfd604a8f352943 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..815a8932419ebc2355ef452fab308223422d44cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf7bd2cf74fb148c62a946c5708f5c2889a576b0f86b401b91ada207a06895a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..141e0204b776729133ce6bba51d8772728f8d6eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94da348a13ab78789deac78f0c15a5c4e044d43dae9412a27626b76eb0c36eb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d824cfcb43a87e78c748a9c36046608d8bd697 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff06c6a9555e731db23f553e15a2661bbcdb2064db6d067e683711bdd91d6033 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5654fde584b2611352f60e4d502d25fa9e2a0d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e537dd6eeebed014a4e6efdfe1bdf6b697246ae1d38567e65ffcc70df5ff6e05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1206968eaa71fbe6e821fa24d55b641ce29d29f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e37d7dfe19ac23f6a9690a298856f497e11d81f2ae9f174d60e720926130f83 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88012d5801a429b4e15d746561f6768ca57f7b27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:defaa797d1159e7ec14163e6355a1768c0744569b657ea2114b1978e1f48103a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6f4f5ffb4b647b97f258498ded5b708341b3f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6615cdefc5c8e0575f3f249510a3cb0e1a827d62368082e9fbd7bcf10eb30f01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b82c640555f07805d5ab25b24c99dfddbf38d2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fbbe596cb81131642cf68aa7785629d37913dd1effa6d69fe4699e6dcf06db2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21e06ea6cce8cd2ba7ad4782383403c2de07fd7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb8891e9afaa5f0a481098d9f34286e6d066dea4077c863d97151b6403f70c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d9511706d2915fe02ec9cf6b8607f7d9e45f5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce4214868416383dddd65ac2483103ec073a785de99957b8b2155ded73c11ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ee43896323790a1999567f2b3b04c8566436eea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4608a5ff125fdf622e187406bbe5017e9a56a373e21b56f4ad38641038fef0dc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29803435f9aaf903841498a7ca217b6baa6ad9a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed0a3f35dc296f3c588e9eeec2a6a72d8566d0c0e7464b803c2fd6dcab6f9f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cabb9706521b509dbf098075c144be8a3049d45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfe304ee302099492ab5ed91c90a9dd69ccde873d0bc97020eda3fedeea8065 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35cb10e3031fd065aca33914a54dcb415d3a0401 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8316d3baeca20bf7668bddc924bd8fbf1ad4c855a589da78e8fc85545ec6b1da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed38929c73299e13a57964b3c0b5a3d66b975a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf2d021249346478d958faf9230f39fa0ff39284657b7cc6c20e1a5cc05c1c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c4e3eb6024633aea402749af71e3bb16d0320f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5dbcd1ca246a99de2aaba1bebf42b5483a0aa117300f454b9667117032b3f40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39cc67efe68fd44f66a710ad29162f3158864b91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b94ada213da7f764fd83d403de28db45dd8994c90afece54ed5c9ad67febbdd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc25d9c324f1c1a27426be9f8aa805c4dd5633f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a61a5f2a71c86f4a4c7583777042a298c704a25ebd86729dc379c21c48088e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4941f96692ac6422cf1ae3725b313628be7b80aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06187132c9214432c71a09d0cbb5fc7a71e47c7b51b35a6d0db070a5fdef25b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78da711d4ce34304d5c50e50cf151fa331c827eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8e3f9724c1da33ce432b7b765fd25c5f99af003b22815769224edaf5362576 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faa340d2ee99c467c3bbd8c2d89cf6d6096f7725 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7f1e9ca9f156f6e2eb4d4725daba5300d96d62f7633932a39cc679bb63d453 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6207d51c52327252eb7df96d0cfa97b7c965d9c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2733c5204debfba53c9870d11e38470ac4d640d8f2eca5d2fd46d1c4ec60f965 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea09af2c5c768951e2ff105eec10ca325138acbe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e113e2675ebf928915e2df6623a9a8eb521274f6830e154476d5ad8c36841d91 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05d43c7be45724e55f85f54a101581596d9b3147 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:199e88ea2cde61dcf16dfdaf661d69cdcae9036ca92b4c38b511cc21cae0bfe9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c01118fc865ac70faae175be956fef6caaf49a23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe82d0b2648ff207daf046e3a43895da08053e17d5390edf8efa5ecf971a4a6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0be84b18b45885c238e4bdd23086645d56a0248 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e27b88d4e3094b117fb92f09b4d0009e5825f2eb915f0b1efa8b3cca112cc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ccef01e6aa0b5e4e9e8abeb12740b0208538b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a311dc59f9c121d20acaef1cd5d5b46371c803f40b80a438f5dcfec123f81777 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92c859c0405ab126a8aa87f36be2a0eb8fdd66c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_2/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55a78ba33e84593d69652e94b7c9e36d6ae591714745b158fea8b1b00d0cb49 +size 11395