diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffcc80504b2a8c2382580028a78294bf11253bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a7a96655e1866ca27e8083357ae1a7c48bf7c253cf08e272c0818a84dbbce2 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d94deb070b85fb839813c59d1208338d6cff1da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7846bdcfe3a35e178fbb77b2deb9a1eca0442cb9fcf1fb0bbb549e8f1bbb2e +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b56795ef44965c093a70484a58f042f08a6060a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aeacabeea574f4cc3f09e9840ae2e801f7195777895ce9458311d17a2f4d933 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d866ca5d7c30e1501947119c3c29861472653a91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d6573f42159a582883ec31bbd1e6e63018de370a0a0f315b9859ba881a90d2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5b746cbb895795a135d8103a4fae0958683c9a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9839a80b252eed2841a82a2d17bdb08e2aff0691aa87669dcfc7123e5ed44224 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee1d4b710b62e5b8cb8d748493c950d325771779 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d2ae9f9fec94b8bf9d6b825d16793d1a2767862654e663cdceed83833d1633 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5007cc3ac4203d44d8bda20ea6dd686acfdea213 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8126beeb659ba5c91ea920bea1b66b714657120546f6a96195650c6245c0c0b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4694cf77bfcf2014760b23be9dfee9532aef386c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042db0cee25b99bd0ca0a683c30698ae3620272af8908e3ea986bf00e71161ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd36846f68791f530318f85edcbd00ddb68d54f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd6e4eec46c55d8f57ab770a198a5654ed35ffe80007e9983b8b303a80cac80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e0fd6da01c1a66562aebce4c92b132c09cafac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19fa697f2b8a519a896ce70d4739e8a41a0187b5074170403f3c56cfdec25ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdebd537f0872e8ab1b91360533bb95d6fe08101 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb75d96ff2fbd4a4059d31044e4fe6eb0a897532d6d784ff8a05933470962ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca1ca5f5956d21e8aaa058576c0089afc813694 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27c9ff58e70739096b760248cbdcf14889a816f32c6371fdb1674dd2e56d972 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95d97e3eb4497bbbe9655bb17f0fa7170e16d67a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2f74a5ba5a3ce57f8305e5e5b5b1207fc930c6d4a1785eb57100b4c0529c15 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..425c128c2f018cf66da2738da51e4285511f08e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f42dba665f1a42282375fe4ecb662174fbf0fd0d11a5cf73ea5472e7597e586 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e9df68862137dd3c08f3c46690c0f75ffbe4a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ade70013266b198989c62e7c3683a8896e43e1b0f3eb37b7270bd6189f5040 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3c7b7286bd0299c9ccfea2e2da68a2f93a58892 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fcd6581d0ebbf0da5cbe43a92b25ecb99e13c992970cec7cad1df1c077835b9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0421606263637bfdd86abd0903d2d212700d9c6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291244753b7d77ab38f0f93d59e045c1869b2b0edb1d0d640b92f775171ee21b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93261c0aac0ddac69402d019de6c185e0a2ee2a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698d91cf517744428b098f1ea246ca15b0db2a160c6211cd85ffd5ae5737dce0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52b223e4ece81cf6dc1eb9dda985687538613560 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9499e5f6c8fdab0ade30d9c1939db4b0b867bb8ae691b4c3b43101db8b6b981 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d18609ba6f8ce0995741574d980f25b11918fb7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7908bea62acf4010cdc71c8f64aee54eede73b565651eb8dd0b9f54635a539f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4fb5fb87581b480ad40122ec6dbcdf804a67f80 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a75cbd8c2fe64c3445c3dd864a100fdb63685a757655cdfb41516c28679ddd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe7371348b31967ce7bb34c5540faaa5a489c0ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6a229e94f7b278f14bc4252f220ad176ae968f38bb85f631e53b6246b6393c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1103c106ab9f1954f160dd50fd4f456c74f07e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a80c65327c625642d035e8206bc9ca64e864c028d8b4a3406e8669b03c7215 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..165f2962b57da83b2e905740ca4c10bcccb35015 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c67e77db1e65b0d7e3ef66dd00391676dd7311215b5622bfffaed85e1f1fce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f648ec63f72859eae6cf249ca1bdf6b2459af643 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be739be2bc000e184df0c1906f2d27fde498622c58588e4f530aa1136b9ef0cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de266daa26da03cd8e23c70d5c0910f2a92b6929 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a813c7efa0b3ad8243b2007a3f57413a577c7c0307190e76009703d9460737c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c14a937779f851f206d41fe29765e85d4bb0fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9bcb6bcb600ffb07110a26456f23e9072bd867d488cf62cd3e265d161c7c3a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..485740c46fd94f43ce774d3e9f57759470a718ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9115dfb212899ffb360d968ee1f191e1c05f081b29fad05e1659f1582e94344 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78441a6597e0dab69466daeed33a5293b1f84a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3e7eb322a43ae2b6315786610c817f0f41c6852b1b7fc363aa037415972584 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19d769db166c624ffbf17d6626aeb87b881ff2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26560d5e3301e3987452b498197562afce9cb6802fa7a2c3e2022df579851ad2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed242571b1fefaa3cdb4986a5bca9b4cf6f544d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f2e6efa120d0f1f64f94c75254890788d379e8ffcaee39bd20d67cc73d476b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6bc4032fecb5c9f92e6c6d1cad36d1f7a4bb938 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c334d456a55ca70a7225ff12a058de95b94693531f71ef9b030e6e664fd5ac9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b26d1cf15af869e1104398eca8f51673dbe6678 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c18f7876c22f60318189c7d638560626d4ffe048ecf33ae1c889aa4468560 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee488198142b889592e079d7c34fd956014d0a2d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e271b3662fe37b28996bc7534a1947f7bdb9aea7e992669338b84e0c94b47276 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f64b04ec94adbad70f964b83b655e334be414741 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049ca7738f944df051e00cf484a6f96e0df55359e5435b2a70a8b2ab2b044842 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef21b0c238cfd178b33f7a16dea47dab55519d0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124ed1da711701e4031baaf520ea4b59c1f6759a11929d68fd90b4bc1d34b661 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f0bdfdf7891c761fa6e2706fed2d49b8e84e52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb5154de17cad2e2cf74e8e2def524bab84db099d4df1c9ba055c1f67e0d2f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..661d9abf49bc42e33e54f9b38f6f422781ed89b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eed0989a5110927498cfd58f50bca43d3e375cff6f32b9121c7c6b72941ae46 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bba7b05cc1f44a9c30a5eaf818943bf0850ef31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e44b79ee2b542b5f233c6cee0cb92915aab5337ea93e338bb57caa3c1638e03 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..601d47d01c760cd680a9c37d53b3a20a0e3d091d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d62d6fe4d2f7bb957f53ef458bc65bde5a410fefa316a1a4fbecc0a23c0300 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52521906d041dcc80ae00f6e83d0f6d0ff135b24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6e4375255e00d6deddeba01225b23173c4226880309b4716baa58f71c57117 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85ffda85a655ab53d6968ee5eea1cd6d5ed236c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ea08a83bcabf88f1eb99662d4b61b3e3b4d9c5a1d4b609fe8c7cdbae773b39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae774dd9a8c6536c5e53e2d69ddb5426361c42d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e93b368bf17750f5a261d079bcbb1fb1b271cd23caf6284d9dd85c76a98aaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b943c3664f0d038d05ced6c8178b09dc367c4c18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190034b2da4c15424705e3f6ebba1e092cc548420919d20717af502de561c3e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b31bd99af4800849299d9946ffbc21eb7526bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df978fddc485faa40f955dcf967b776bc1c8364b458a3761b9f9173dacce708a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..755a3a3648e6c1a5ba46af4a8ed7fc702d041fb7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93301c966241676cf0d60e1b734854a63da73f10278e3307e7a9441d483a39c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bb79ac8e46e0914457c003be586d1c3f5b30bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b020b4450fb788ad45b3c0040b7b6cab31513d3960950158bb239cac4914a836 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df73284a3672064cdcf3b0a6308698cd0953b62b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:959fa9ee4d6f7f1952ba4588126397d40678b7ee58d5082325c4571e1976d067 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c960d060abeaf7ce97448e3516efa05e71a8d739 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751687fab42425b2bea245f8a8671525106af756e938ee7b0ae4efa1a4f96548 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edbba50ae2d3dcf667bee1b87ed5ee675817034e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b767449575c610876864ffc756d0570b4c4d8978bee3af404b0ecc02b2d2d964 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79be80bb0f62eb3ed74d881582f0dc9b2db8b2d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f5560154c52ef171b61d3ee6dd69828383eb2bdc204ea34ba5b4ea8333ae22 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a29b944b03c580bf403b86561306977955a0b94 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391e7f2d8a299a9bc4173d67c73d795f064e31b524f2cf252f74de6638f056e7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50fa609215d96a264bee61dec117f91e456f8972 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbf6ec73fb95d09df890203db1fc0c7045e7e78292d27927f5828a1843dcb2a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a12d6aa26ec6fdbd21ce61246f10bec2b1c6b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e0b986af02cfd3837b08a67b61f9d2ae6dc81cd2f5ea52a0d807871511309a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c962ea5b5843ad46e86845e5efc9faeb74d7a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff766c7860363db3345488140cc19f504f100be87fc100a0ce4163cf76753ed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b55110fef60383e41bb54555e3ff63184e9f3366 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06e47cf1b3a8e65fdfe3d44ea33dcfb7c696ca18f697fb0568007054d366bd7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..725724f24f20d8c41f09c0227d65d5dcde846eb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae6c94c080b16a0f48c356648b3605c0fa0ff6bfc5b174612814d91ddd382ea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9687bfc3b951b57bb9557323e380c5fc5cb01f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36f4d6d93adc8894f4d479eb4f9bf6c4f38b6b418611badb91d5cb6d3029169 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e543143c69db97f67b1f37f6b797a65fed2f2d65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e183270f9a8364e6a39279ddd2566eb1ecc07ec8591d6bd7af885c646aa1ce9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea252390be85eefd7ba311a9c2de447f089dec1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c040364ec10980d3d4fa36f40676b9a22683967b716f118bf29b91e5746f3291 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2c58b06b4360a7fab58ea5de32a3c67b186ace --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b13557d760a92317a352afef5d1f207bbeba519259a0459a702bdab02070d9e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b05fb1347d21f63b1e2e3d329ea854f7ec9c7706 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe23b2aa77ff95ea632cb8bff55026998feb768ff3d7bcb83f08ada05b559e4c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d3d9d91645a9356d143e8da1f865bb99585aa51 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bb46b3cd22648deff2d27ccb00c8d2facbd0ee6538b630258e656e4d6efe28 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..782691b1d1095f7e4a45328cc19e3d8e29dc3c07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7d931f2123453aa53dae204d4a8cbdba307df01eeae70538490ce68d183efc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a80d9cf7b031f9948ea122c265e9b37eeb739d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6883888cbe7762f7bf2456e1ef4bd576995c409a44a8160c497a4c9ef13edba0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f43d6eab64f1fe5233c612a9f9c2080c7b3e30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c47dae6caef57ffbd24d40ee94d8c3dd077da1461ed81b1bbf0a4ca039b569 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c9f2f45a2f3fb85d0bf7d7cbf656ff3baaab98b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec49e38d0626dfaa780ea4945d79654c7ea39e701f0b7cb3c7dc2b03f8484c61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf033214efa8004df0e92d2d0af77d55fc7df76 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4000a54c659a14379deb3ab7c0fc1cbe7c7530f4cf16c3990e0c05d52048e2f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2496ad7985a64f67e52e3d77e5012ed6d7161b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ce064f3a0dcfc67afa916f18486e88899de923ddcbae29838100a9259b2e5bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..652eb6c627f0533a4fd22a7924f3484547096009 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba8ee6ada0b190ac425cd03f388d8d5abd3c0ae7357a20954b80d81b22366e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bda96c0b5f755f01c7f08c0b96060b62f4e4b8f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d88ad6a9edae88c03bf8b8548b164cd2a7d3e5248f8f805dda59b6ad4796cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f17393aa4b4beb1f1ced0eb227d8efb605934b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ca1281e1eaf48f89d733fe78884c5fa03e6317c53b460205837f162bd4cd02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9650197a6b27234ec42c0d9ac44724359395069 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7d54e92810866ac9019352d79419a6681ee75c8fb379b3d66c2740837fe0c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a92065b76466a4b40f112cd6e817dfc7da598b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610fdcffca22f55243e25cb8057b65af0d344b0480f77b015242be1688176257 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f4d94eb442241922ae510f6caf65d9328a0aa9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fb7b6555eac4cad3cd91a9f2d28d72e859f6bbd8ee1a3e700fbc1b55701e8a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a10108f94bc86c5dee825a62f04b34e56ddb67 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4449d182ffdfc7ec4996afc9543e1dc0968edba189f1b076a8946fcdae69a02 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46275a0f003fc732a0ccdff3685f5a29cd66cc23 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1adff4177f51e5f28d2021e3364b2830469fe3a8122358af55e469d5f01f3067 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b150bf55ff1fca0fbefcb8e0c544db539526be4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6327fb8cba09b9c4fe38a22058756796c2b62c6050873211916baa63ef0b578f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa098a0accd632e032c8576197c0a1b7589f5991 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1f1758b38c5872a75a60c20de341261adf161f35b33c688b3d9f14dc508ae4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a08af7a2a8e950a29704fb988b0fbb8fcf2c05 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be0ff75f5f5f93142eb53246b855b1f04618b97b486d3da221017ab559833399 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b683e3d4f81e0bb60eb63f6ba20563923a6bc0f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfeed7b7bf862c8feb821cd52417a0a2ad910d80fe2b87d6cd9894afcf29fede +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b98f29f44a4b5bf290091281d830137b3020043d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cd5e6cbaa9b3fc73dbfcd76938b2844e70274a052b3991bd898e6f9a6e2d8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9b558fedc7f9d091f5327878aaaf6d3e311abe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0f98824f6d8adcc9059364a9af9cc62be0f14078ba049fbb8cf6f4368e2304 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa7a675b3bc6d843d47e0ce66fee0481998c45e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31118130ca797324d5d8413ba59e955602ba136633103b0592d9419d8eab95db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ec02cd5405c7c16e70339848b9a86d6900ee44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52e2231237e6600809647703291e457d10e60d1bc040946944415d6cfa1d873 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1abceacb611fa8f13cca217ed34620389044a1dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626764fe63793e7ca53d78ff265d676a4706b98307b73e3658a9c7f7d0bd2100 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5935deeca256cf387f4812e13b6a51fe18d72ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138b2bb13fd000b587b6a2989272ab66a28ce92e42ab1ac25bf5f3421806feed +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1001116b5fc018217dbf5c5548d0eb378a4f28cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf59d5e362346c08b24a3e7131a7d92b6e83d7dfede7573f54958b74cf35f5c4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e26bd0531939d97a806ac8c193ad627496e666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad646c0b7623a7ece9f3d65fff4506f99ceeb70222aa242fbe530f6e8de22772 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec727ea01bd4945a21ef4cc1806e6d33a3850072 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1880c7c2cc738a92fc1b4813f0c9dff1a001e333ad0f003dc6ed0486f7450f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c038320bf0941e0ed00eb8276704afbf13d568e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cda2f2c7451d62ac5a91f411324069a2843f72d76d390c2e61dc80a52f4247b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5335759f8ff3df24c290dfe2cbc907a0b06b13a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99f60f9011e6420e69b5f203d2f8456f7c064f18cd6b455a1fde415c7ab85d7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46c28b673e2a090e58f6a16f8a639ff468db8cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64acf712f8a5cbe7d130e78a062aaa58967a4a953efa08d1641da820ff654b01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe8c8542480818374a5c2cc20f4860732ce901f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192746976f75921766e99333b47a15f63e169d21d9f85813cb7f23aa2b8aced8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a5fb58248bc5b0de9b94f25adb97f477b30e0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922c7c4ba99a0a240787389de55355de1b7e87679fdb33d1f2eca70cefce1604 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..993ced83fee893ea7d8721ab3d4d523868ceff5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34833d203109658c700592d51c510f07ddc088d531cef769b637b59b76cf2e9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8609b4cd95b42ad1f105e234aa824cd2937431 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d7ad61c2d9a4a1f851d3401606837f19c2868ae46c832f365566425a13bf13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad88fd3140e6c727509b4ee9092b5d8db35abaca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23d45878c5d4b41116e7d5947a1d75a66525787473b40118f2f171c7fca0312 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3c5239316e66370a9037368f7bd11accebb4f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c28492859902961e194c2ac17a4d4be89b862cce35ba369ffe48e4f1895d7c4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23e3c41a30c554d9deaf3c275872081bb129c9ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9874b74dfa054165978aa5fcdeb5c9eadb77f4b4d35cf84202f2a35f3cbb21c2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..438dfa52ebed9c6389837972f7bcbe269ccc151d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51623d469bcef7ea1108709cec39824a0d9084e3a345c66069e712631830ec7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b347c667a87c8044c0a3fb69dc0e6614782c9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:812fe59de765f8e1158fbff2dbb2f08309f8ff05ac91e1e05ba8a05b20022585 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..847f583079089a9da2c36f84be20f45e165bf763 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9810647bdfd67fe6f88e69378d979152d114de938298b63bf3537788114eaac1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d99062ce91ef135b65ac10c22b56cade6f93166 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f24ddd9d4c2e512e7d1e903ee674d8e566d41a99a2bfd4322aa24b00ee45d50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc435743d1d1b8de146e245f2fece44f94c4be27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce39526171aca0f8afbf249cf5790bf9da0d7d667ffac0f7b14d765ced81c1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f45ad5bb519fdc112f0a24dae5d1dff13aaf00f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71884b373f11a41ac6119999d7c684b7610979d6d69597a1a75659e71d310be6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24008a87403b843910fcf2b38166163c55200c9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2d7130d13ce3724d126bfdade4d13cbbb8adb7d8ec807febff4b7cba824240 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..618579d79ee11ca9bc57ae4cc31e54e4c1e2be58 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38a15264ef479322057f359facd02920feb5b3e271da7a2af63bce28b24673c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05dd483b9e32eb76b081bba8915331b97dd1acf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24bab3434dbce17124bc33da712bb8c6c44977b472ebb9a058f4a73b8b7fd379 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b848f20b53f129ba602d0cb582bfb8b3c9442bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:681f0441ef21c15ecf1064dabeec531ee594792484f779bb78c089751530f5e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d49cfcf24444f3a6a9dca80d8597f1e12c0da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa0c03f647dc6d3d65bf5c189c0ce2cc2990c415279a6b69d74b4c8cb24395e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f797dd3ae22a95284a07453546e302bd65fd00aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91459b4656ce3d2a2895f9dca847e61bb6e199513bb65ea7ec56f2250af76de2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f947b484e8de7998895a8448f29089f2fbe2aa2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f11490ae465ed2b3d4e1f42cd5de3aa05d2b7cb0f6dddefb55e5d191a123b10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..153b14420eb3390b5ed50f2346438aa1ba4c2b43 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971cc61f39de3b0233ac7325310cd4d92634fc078f46c1a42411e58fcf93f715 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3835bfeb9c907670371f0f77d9378f9b5526b531 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc2da5f2ed9c765c908315ac54e92656937c48a77b83da86156e1dc2edf7b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e40df12d7162204f240d9f6763bd292e106d240 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00d0f1e9a937d3b6fec1109063ccccdcd15a88bf99a68b5b08f369ceaa60552 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe1c489bda38d73e7acd0f9272f0a313d46becc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8babe7f16f2d8cb5aa812460f9a26fbfa513982e5a5091e7eb0a6ea3daeeb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9358d2fba6b3a4e3b759f255030ab30976a7f9a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4c1b930ddff9a4b13e4864004270ad220f1e0e1d0ff5f219cf3e08351b9382 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc6bec36d49d8bcc45a7b23120fd50beed88389 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdffdb9fc9e0f59458b925127d9918a8ef7385b5173dcb01a79b5203a62e40bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e259787f8d9e1021a3124a7039d3cdb4861f1236 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265e729a22f6041cbf7f844da71a57ac1e4f87ed75b0651a84d652ec1bcf3fee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9323cfd9113f73950ae54a3adaec1d551cfd02d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afe062f8985582748c444d44a28437e848d420f3180c219cc1bbafb03db3ca4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0973fca82a224b3ab12db4eca0b7324a1c80bf5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcce53e383004f29d79755cbafe156e758247ba163c6f4cbca08ebfb28414da9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ccfdd8d1168db86754858df7d0486b9f058e1af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f48804560f5b83ed3946bc5ac57b9ba196f884c0c76142a83256e82013050f9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db2c61dfbd8ab5d0623330a23bad569a8749f651 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1843c8d3acb9b66fd71165a9b8b49cbdde37fe27631f78ac541bf14d819a8f6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7454e3e7e58356987cedfb6d425a539731c58221 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0476cf6671e6456d88d7db52d0f20ab5818fcb17af450460fd65f91665d65f3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2200b73cf245eccd9363a365b006f2cb4592fc5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a98551d79276984ec7a62624f8c811947fe3cc6a04dc7764b5a7ddb4162824 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad5c13863885d61921a6087f4180b4a9dc5a06a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9952083ce9a7a613d1260ba47bc99c3085a4700b70aa5adf062b35fb466420 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3104b9b9d11bdc309843d6d584e48cce37107d8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237c6fc4d758f957e98c8f01c18d2e9c6b338dd17fcf23f47f438b8a8d704fa1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fe5fa84c7b02981f422d9aa5a6508ef4095b16 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59502293417a9a9c5f997d4dae11f290a5e2671f40ce6e6cdd3671fa9ebc22f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2179d4282984c876a9b2d868fa1cb9cc6545e9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6036434b289906be770068259a8f02d11221f3769178d0b5f9e5125ecec44f3b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0611987013bece1404980b38ee0051feb0c5bc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30af1473434e859dbba6200766e0f1935814160c55c9ee1c9af00bbd35634e39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87de5c7fd69bb1331858ae32288599ff3cf73092 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0033552764fd4fdfdef49c150e1ac45805685d235de4a567e1586c29a5f865a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03479189f67396fed16c98f5142168767208d6ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:375f3ca7f50837fa2f2554faf1b97c71762551410cd3f369a8049163154907ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40154f309099ba69c636a83ddaf905f7ccbfa1e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38840e24a6080e8a832b163452d3878add644460c59f0d52e51310dc60f76b50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d38cf3faf7dbd9629989a00ff6acc4cf380730 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4379d9dab4d1be052c540dcfa54c6211cbc10a11f5d10810fa2ad6729e766e8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e6747d4e39c57aed920382017591bb3e18c4c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f7af27ee9c9992f49994462d0024d617c7fbc7689b3a21220cdda52dc19df4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7702ed107354deeb10247364cb99f8384162b70d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f2757cfbec9398b82ba759948128eb3e7f33d1ff8cd690857276f40f926a93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65f555a65aac9d5dd2d926beed1db932a81f13e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b5d412494022dd8e9edb687abc8cafaac0f62cb5a5dac370f9340e622875be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c43e3f1cae3db56fb26f808a7544c600fbc39e12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34270dee1cb539cc066ef59be7168c3317ec9b718d3251228335ab9390eb6a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48ee7f6ff280abea3b846a81bea6bfa3c14f0765 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6f9cc1ced385410c65c4feb7d7d721fabace9b284fb51174afcb664cd69743 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa149f5e893005df87caed6611b30224a425f1b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b86fef4e1f6e4db2cbf61e5b8c9ca0828899c8cac05db6c8db85687518c48cba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e48f36f99f55a193e61e4ad7f31c0464b92ce8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9356e8b586563b1f7ac78b728caf547eca77f1fd9fe4b796ad643b3d583112 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4228e057fe7b5e327b2e3fd34fde493455b7c28a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b944da4c3370c9b1c4c8abc5a15e252f10f28aa156f35f0011ade1d10a5b7684 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3a04c53e71cca7a00a730d9e811a13936e8580 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbe42581cc6a3cf5ebad34d346d8354cdd53f51d9ff7d50b7d7f477fa091788 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0632b3a0e4081fc1cbd2a150cc4f7afc6893a20 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9368b95dc6f83f203bcc9782d12e849f3eca5ac393cc101f4186d1047903163 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1ab0c017f538d751670f9997d04304210a5fb8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830b87e7aa72cd0d64cac694b92cfd686daa7a92c944663c58cd63241e3b1275 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d573b296c97bcc89b8e725c7eec6d58d0a6a442b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69517ef9b12c59908e77c2fd2685d986c3d3b53020482c95401f19c777a932f9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..613d5403049842cbe6033e6ad1602a0628de9123 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac15871f42e48c2614f0518111afba6dda0290b4201da9c44ff5624cae6b6d09 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9b21fc9e5d36e13f7f60b5608c5e25739e6884 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e884a2e00d26a7c0a18f04aa32e2c04cdcea22afcdca0d01460253412bbc18de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65fb29daed3bb2a682638234272f352d34f072b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedd85eef9a3726ee409d15e427d31b2a509931f19f5fb70844bb32e82220168 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b523092c8861225a45e8caa0f6f302ef298feee5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfa798bf47042956ddaa19a68d3ffb08e03792e8e0edfe09956637afc3bf98e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..268a80151ac5880c80a60b950b49992a9b960ddd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6a9a3d3ab8bde5d48c1be40baef04252feab87144fb27e8ce52444566fdaed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ccf189b4ce43576a1b42c238bef593701452907 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d2ba57b910019ffa991ccdb4973a95d416da9d0c389e4f2458d7ff731c728e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1866a68a7e6cc0188dad448ca14e9d8241fdfa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9f849c38dfb18cfe84e947708746410af8dc759da260052e39f243f938fab4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ab9f9c999ba384a4017ccac3b78da816e6a3d36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce71f2ec0b76d6c91ab17f0a99badb2572cd689a3bcc0b0c3254d6376154aa77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faa09d08954cd7a10f15bbc8f16ec88b825fb5b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e96883847add612bbb46d0b2610471438aaa56f6de6eea77fd50b4e4d4278bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c518b4deda97455d514ab1c66051221b2e6d3ff9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b2a6a740a58658587b07bdff8a3b291e4eabccbcdd11bf14649ec3d0242cd7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..595b5f90ca2a06e582161838fdf7ec7d8da757f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3abdeba2cb76e6cd1fc5fa4bf682f531b260b53aa40f1878dbbed650620d67b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d60659164c966d601dcf37dd2f4ec3af7c651a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd7ec34f1b4cc6761e1dde21dd4be3fb348c54cb3bac364ebcc1c7af124e143 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9af491384989bc365321302e9cc64758cec0a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb825f4a91fa7042e92ff52d00967cc29577614602f298e1d044c5002019bc4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f0a9a718bd8277100b6ed63b092ce7dcd78597 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa07e5dfdbae6548216c224b6df61bdc1c0c30aa525c93b3b723ca9ad3ae311 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e338c6c7818fd7d5cdb8a9d929c89ef1d8f77a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2a66edf494337d5e940be4fbce1f998fa324cfe99e01eab0b3e16c5ab2a593 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a3bc483fe3b524c63e62a27beac9849ed946d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66de49ec74e566dab789a3076293d03f78289f030b54b0f089ad41d11127a341 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e926c317396578ca4294344949dfc0562c862ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef29800a5f48deada152fa5a6979ad9c7f6a35859cab67466ec3ee10e777e1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85605116975f818f02dce4b92e3e6e6489845cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd719b2841f44033aefe3a540e6df6f31c3ba14501ab022d291179b9894a21a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d170be725260bdda9b404da408fcf42d7029accb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7793e3cce0270c645ad54b9b3330c474f3eb43746eebae458a45021ffc28c09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1d4f3eb783e56af9caae6e7bcc6f8c236484b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e723938401226ec78d64d30f0a3acd0f0214aa5acee160b7acd04705a6d82cc0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02031c0345f7ea726aaf9d3eec2cd32408a83cb8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422ec757e3e3ae3d16cda54c9ccc552a88f1f7dad4978d497715fc8201f725fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f08cfcb9e16478d7ef6e2b66b7253e4d90b8808 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:347dc0993b0108170032f7d32210b6c9b27f38735e3659fd9d98456e29a48586 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc79b9426d4ff781eb7f75ea0aa7c53d73bd526d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc81ea3efae83e6975306efe772e27fcdc03d640a7315f61bfb49c8bf70fa46a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41ef762645faf46c88ebb6d6f6e95d6fd47275aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93f47ae532a1967f474b2b6a6c8bea9ef550ae0f59350842ace50a7b6e384b8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a67ee6392bbd78fc0e0f86fec536aac257a8afb3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3854d4b6bfe79ee104e1ec57aa97f292f583f48e185925d128528f7c4424456 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e85a7d68c12cd50e9915669957470a093e3dcc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24ecea5e2d765c91221d8ac64e47492f6b2e22b699a4cbb20c4eef2b1b1f481 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85851c01b606141f60c02f3ae02f2b591d687abc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4897426e3949fc6d012bba8c36daaaf79d5033004fe34920e96ba6b1a8fa0059 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72c395f85e28c69ac8a3f7bf6e5fd81e1f29589 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd8f2a63fe48f97b826b3bc6408d35089eea9b6d6ec4897162ae42a39ceeeb9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a73896af52d105b83170ca5d0193fca4f02752 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede1bdf299d602ee40ef7de2749220d230e864537921a2de2ee9eb318f005a94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b4a78f8eb03a34db37b8c5acd583b651a105de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef44b979fea4200d56271d158203cb77d89747c5ae744f7c2b36f66454a2ede +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd68ed450cee09150117649a513a6a004dae0b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad879223f94b0bad3c0a5a14abdb8d2115a4cd70c1188ab3a2ce331d03ca034d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d736d139cdcadedcd029a3514ddaa39aa7ed2b26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9148c18e62297b4d537b4f6ff2597c261ce094da38bdfc1e1e9348d5199208b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75bd26c4092c4634f2d24909fcb99627aaebad27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d28f09a363b9768a6216f34a4fa0117d817b595ec93cdd20657dd48b89f6bc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaecbdd1fe6bc9ad8e4d1b1d5c773229ad845f21 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd5d869a5a968596ff98596525ccd4af6ad0c4ed5583d95aeb60248f9d93e75 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05aa4ef1d1d9b2347c02fdea86d851d30437dfb0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20075b18107353b3fb9a994e556082980a54172eecca031ee2fe240144cbbdb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1153c791afc538598bc323bf72e9055eeffa49 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03eff7b06f848e451e269728e02fbd76cc7b0df7823a6b7fcb0b7919dafe81ca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd7e488ba952227999fc21fe177699ee689f037 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08e42be9ef46578d67b95850ddf3bb891efac79f3edd2f9f77588aec196d5c9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b96c09fd8e11ac14a8bcb3a44ebed1c4ee93ae7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2413058283b2d0b630c86920b941cc6658e5e792956b6877012b01340d347abd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3186ae47eb2b5e6c4961d43db2ad75739dde8c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08837bae1e95d013b00d67f822088a5160b408b0799b56607fd6a2a7b9712133 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03836837c38a9cf59d5a6c52afea81abd5ef7489 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118966e564822d39ff4183843fe7274114c11f691d43177c5247d4244a492e08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de4a0567a6de1e625b38b287889937392f2d033f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc2f77eea183f54d9bee1f3c325b6c261abbac0be3ce5d4061692d28a29b1ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d104a4a0c0eeb733a2d394c455d5d25cf521173 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f282c437f21c5c46ecc98f0bea2acffa799c37cf4314f7192fd92ee86f218c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35267adc587f100efee4878be71acc14dbdda36f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a2f945cb00085561626cccb78d1757b38d4a2d98bc2b1b8dbe105257f62627 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e432185bbede3e64d93ce541bb9b74148772b04e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed17d2afe4c36af6ee59148662904dfd1136da13eb5bc40b0000b1fa090dc493 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4266b28fe8f1076dc1ab61671753cf6169223c8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c845db1425ae0536f1e2469674ed8d3ce0b5cf497f1640491208cde257f6fae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77fe417e7f5d7394e570d184f113166199e3ddef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c1d872903601aeaf3435c510dbdc7779977c1c7febf13f576614bcedd26f34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60c8c087d8564561095440596ce7ded90474cad6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25cecdad8f5f18ba1603809248bfc428d3ac4d2c289da55fd2d06e197a1f0710 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed19ff07cf143f56332e578b0f18f46139a9be42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b252c1aa9c55eaea7c2fc174fe651938c0d6338286a68a18247c09a760c4f040 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f895d387570581e0283367e90991115acb08a2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491294d908448647ede08fe4c86cf52066c665afaeccf6d344698d876a5b03c7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..707ddbafb6e1c6079c57c27d5ab4f4acba261842 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84583e44ced8c9779c50e53e1469a1f945c38347953147f65638401dec55e5a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..845e0da3b328cd22e5a139f5ff6d4bdbc5c5c993 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2dd7293759422e8f2b3e75151d69a256cdbbcc382b2959f787698102fc0db8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d0bbc7400547f7f3474eb65ee205b46f28d8d6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052d437b0e0dad7ff05710bdf926c96887801b16f3a15d5a993bc71bb3000c05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0c6ded82d6819babcdb2a48de904ef908a2af0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e12678a50d5705aa53a4cd3f31b98815b198540d3765994475d5f5ba0ddb566 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..caacb90bed37f1acb75759a3aee5dbd0f16ed207 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a33383bfb402442476088cd11b89175e0394fdc25c28ae14ca8fa2cabf3450b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3283b940fbad01c27da0ad7d5b5c23d91acb1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83a6b111a6796e192120c0c94c472ebf2215cecc56184dd65fe4e8ded266e878 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4087b8daded6ddd8b2ecffc74cbf66e15aa251e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d55b236f58059b03a477262288cafebeb1d85656dd317c9dcce6310c220841 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..132735cc31d361ea03318a4324838399f943e0f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a068abc0759e7514e750b50267b112b959e27209d02138d0f4613fd1abd0f6bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9b20d592913e5fb478326b7b4c76b3f3132fe59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb432c5b0146ee427ec9e777ad558715352dc606e989ef3d1122c6d0411f226 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..028d843ceb4c0420dd561bc9c5669e3f3ffe3fdd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4008e0024beca45c5779efd2b85f850101d2aeab56eb1ef5442e32d2bc619c5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f2551ac3a8f22299f3b2515eec138e27c13156 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134145e95f27a30c433cb09450ff52b7f3c3faadca15145f2eb7403924275994 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4533c78e8e20a0935b9b276af2791fa24a58964e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c42848950f7b945d08016512ec1c19e312e8356d234cc6de3b5a3a3c2d650dbf +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb254ba516d778266e8f90fc8314ed68fd543566 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2de595695c42a73b71a155cb40d9b3f46cd871b1542eef9ecf3c701af3a685e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9557870780b42ab78c546124f97effcdfe2ba502 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4b2a16ab57673c7f9a5ec3a12830cb5c746d4a8c33bf8f95194bcdd3f91c4ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2125a50887d4363b8eb6cd6c58c8a736efd19f29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9c6d201a69cb07eca7603b72adb12f9d10a4532e8ade761abe12ed2f337bc0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd43c8a2c9985faca28cce826c7d1f5dc2230f8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbca1630180f22bdf49f9d0e640382aaf4590f1c52e6596aec08bdf7149a4129 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a642b280678f5c88022ccd1e3f1a217b6c3b8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e908412161d22420f38b6a6bd43df1e7c18e8fd9d97cf89f651a0716638bd6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a0593a8b55c3578975d6c645526f63b85cbc4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ff5a792e60007afaffb19d088af0115fbf1918d7d0db6516112b305a6c119a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b339dc8cc49d0f64df0cc233de4c0002958be325 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13de512a793a2ad8df12177e5b281b6b2caefd172283d0ad07c914e58cf03172 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e554cdfb2eee00750e1c7d838a762cf4c1324969 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a8eea7f83442b74bfa1ccf5f1b978367a15d162966cbf82f88898359b588d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d2fa7ce0c264e0b3639a88b68042f82ea94a6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687fe89ab811bc1f3baced3e6454cbcb23eea870d0d8a183ff0ed310c5c6895e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1c851daf3d7562c5927d03075e8ba3217131451 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005b021eee8f5541e9ea1fa0a923cb1eff8274c17f380db3452ebebb40aea701 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf660501c264c80afa470282c3bd0c6fc6ba0613 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f7ba68689080630ca753964b21387d1573b988b54fe5e899709efecb176a51 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f91330b5930a1a96ab041930d6f8018b8d479ad4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fec90ce938435e6e24ca80d65ef9446d2c404af24aeb4fb7ff3a0ca2e0237a9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b539e51147831fcbf2f6065a45e77600cc4862 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb92e7ec1bb5d1f5f66469eb5ed5ce8fcb9b993665e48fda43a97c74055d9165 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f52723af2cbf1d30ad622df8d95f8e8491621a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5daa31f786b0991863feb5517528cd565533eef92dc192987ddaf39382a377 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6faddc4987e0157c4ca781093a20af11ddaa47e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22124b806ee3b2981896d0ff2595920bacd6572d1ccfc1d0d6e09b8439b700f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ae00b71b953c81e4519aca2bc5569229f166f1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4044db9bf2bb9c40cfd80578a7aab2296b257ce238b9af29dd917ddc8d63819 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..861f7700e04056d9e042081111fe45a11431379b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4c9c4008b4fb27c0612d86119369332de17d6b0382fc1776b4f7e143bd0998 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d514aefd0480679f6c76669288bf1459ab177b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c076da7810d58e2a2417c60dbe00d5131e91675df7eb1b27e400c144b4684be5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc1a54aaa6d74f7651020f6aeedb1cc1b338a91d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53a442a23bd3b3696f3b7191ea5d881a8681171209674d41c529f18e5aaa791 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1559be6544b4669045a2db026fa3c7685ae51368 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c95e68643f76be7f64687bfe60e99bf023540f84663b54d9492fb2099a2251 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36d96c9db93161e8d2aeb5ca532966f2e79714cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f4b37ea08a1a90e80224340d5f85be8a6e7831b277ac52f2feadbdedec25aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a07c30d25984ea30c975fee5d2ad3c602a5568 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73e6324df1872d72863ef5e33f53dd7601734fd4024efbdc344ba5b45479d80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..968b5315fc4d3e71c46e8da4148107e427aebdfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6064fb393f40c13a283a3a19094ce8a143c90d78dedc643a7b0cd6f6ed194922 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f21129ce985ff9387ec3d2d9197df6d0c639523 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9960c8758454e27255409afb4d81d7d438e794ac56a4be20bf980c5df2ac2dc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e671dde993c976d2130ba51a0295f6ca7e87efc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42854c4c5468b15ab85a1d520b8a874bd9b276df3e9b0dd6d1245d7889324a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91eb358f08ad031968626f7845c0d8c3b37b453f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b885bc48304095ca5cea86159ef8d88dc5a3dd0b6d94fe3c3b405e01784b8c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8867bae8e2518d07a737b8ff2dfc42989ad1c42c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6173c282b934ad2fc94b67e2b3711a236ad2a79bf332027d430995445a8c5eba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3ee9aabda7731bb9b04431562827f9cd1644272 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71e94a52de2ef6154458402dfd9f2271d5f6e225a8b9bfab8d420f36b6d265e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3b6fee70b8803af4d3ab2629960aa80310704d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b433dd65ef431c1593f0e563768db54138ce6b10cc6634f3f3a4ac78145bb930 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61fb2904fe4cc9b169ae5e8881f3182429e5ee84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcf8b5ec3e97ef6e81b7288abcb2405f56bca24eb4bbf674864beba2d8fe52d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee468d73a4605d443ebd1bf4c30e180806fc87cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c635f65bd02fc8b9e7a6d4b4d5eabb2ef02245cf991b837bcddb269a390cf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d94e018701b60d21c0e6c8a7129c5b09560628 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f565c8db6a1d68ac3f6ad2e582d9c7551d96c26542e5252b057f739130aeb1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8a763b6aaddde413be3a0a0901e2524253a021 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ef9abb17765251459dae825b000f375d8aecc027622996a6943131badf1967 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..174ad02dfa3d8897c8d5680b1e83c564987b64ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c719b4eb640a3cadb4fc0d99afa2613b151924fbc1ea516f307052e27c243519 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad59d95126a367fd8d99faf779b3cd3a57b02f07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c633a4b0f945a76248a5a407e96a150a437ceeba1ca009159c77813e69dd9e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c31df67e1013aee8de5c858962b0d88a052bce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7ece7da3c5715eeafef72b55e5a58f0f9844e35eded132d84f37adab463bed +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04cf732ce6d86054b4c82ccb0f685f3ea79b19d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7d696e1f8269a32cc8c08193e4042361ec966c8f946107a179502dc2a6d170 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62f3d9f9adc2cba4f1b23a1228766ba5587ec990 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1303ac032997806c154e08dd427234d8276b5c731b791597c2ba0da4c6f24c92 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf2ae06a2402aabd3b83944bfb4fb1b1b654d152 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed3c3114ca151e2a798c8e8131bb47e033846f455d717b03cef8607dd2a3232 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bdfb82ee6e16d68cc44746a559780960e6b7e77 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35cae9e9896e809333f4ba11f6b2206312a67503b98019c9349b973631e554a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ef6e0ab96a92873e5a3597923a17a9ca3b0edf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794bd89f21166e9961f0314400b1bbf13604d8291d0940078bac9514ff8479c8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95894c3f49fde74983eff85855ecbb0518ee7c04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ba9e8ecd8cd91f8394b88a3ad63427ae69399a4989f82acc58cae5de8a5563 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc1b5cb5e3055e3ad29f5df3b77b2e6a3a8a834 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4e09476f2a8d3bf04a573e8ab8fea9ff6f4383606ec5da728f4fd141713b97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f88d9630cd917aea2710d171e2f6c4b86c0473a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:625f91f0d16ec0cf72701d957976d43e81f65b6281a0c65a0fce9c6190c8c803 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3359840735e54705716c89042b01d76c6a158b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782696687ca8ffb10e613e7da1b5175133bd4753c309d8c6e8d057eaa9d4a65d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3457571bc06797de2a4c257b2797cbbc976169f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f9a9d814ff0abfdafd4b517c07044c6c6534804006c0fc6cedf773400a3d89 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b391d7c28b966355f396f4d73e15f189fa9035a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb451e3c5291da7ff286b5b5d761e89d89180f6e03a1cdf1b6ddfa551be85d8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79df76bc70068255d9234d4d185b1d9991b67b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec626cb41f8bd55b8c1efa8faaabce04052608965917eff076a27770f57f953 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55530afc6182ae536cf998a636d1e86743cb369 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4f17189b9ee7a85f951802ace99de2d2866b051473a7cd3ca7c9112e49b521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cd5de689958aab1aef2e5def07356a15ccf28db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1610c3b8eb8f9de7e9406a0ab06a5327f0c517e65997edf046e992eb67de6f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07bcc87936238a9aa235604b6d21d7bf5de720bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc3f9872c233f1ae2738d402b7b5a5bc2cfad5c4759a090bcbf569616cc4cab6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b08d2f7824308299e01b900b6523da8b63b8d9bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56fabe67a636ed54a33cb19f0efbe437cac13fcb684fe911481c693487dc44a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca45c3aede6c753c89b303483d8c1612733a38b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f727243e62190c5f12f66003bfed58d76c66d813538c8142d0d135ae2bdb8cc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00ba0b7d4efc423a9af4553015a843057731c1d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e8d6db3b670cee43ee1bd11679fcfb33592fc62f7adaec9bdda177a453b898 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7753195ba86fdab986dc07c4e8d3c31b43089bbd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7355bc5aff6a0a1ac1a4599a7b542aed05c11ab51c5e5017f6948f74bab81abc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f81ceefe4018bca9e511cf6a81ec036fa134ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2060980bd99a49e1133792824c52928c066be832139eae707b02e2415c008482 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eccb4ae340854523bd4e37a308143d6c2565c075 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff393a61f1850dcc18ad365770fcfd0643c1659a453d555057e2fd948900599 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..299b55db3fc83c8793c732d8e95e8791aab62b09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28a5a440dab234770210d5045a6c3f25e39d61186f0308fbf813123e6d8f4dd9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2063dfc6ccec6e63e137f0fd984ca5af9479fba0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72caede3df97e395c9a5309155ce97e2c5fc4fa1238e4f1c879be249b2b677df +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a0eee07ecc61fba61afc922a3bc433f47de341 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025ea808b7eb92a483e0ab60cf506a687eea6e230bbcdacc456272b24a8db5ea +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2224714ebc6673191b6ac7a94f7d5219c020d267 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23986e74ebc4b01450150cef42a4ec2b89a515e5adbf7ec4c341f31000ed8b09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4335230141566b4aeec37b712796c5bbd095e21a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2728cb6a593896563f88a88043c141cab89e9f9ec0a0d39b9b01b857115a1bfe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07aef01578883c9bfa2abd87e2ea609f28144b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ce498b71da0947f0e654f7028f7b5008942f965cd131236d84579bbda1439d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d287a8b33c2e652baa400c87e6e6d04cc06f6fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e7d4ddfeeea24de6d025ce705024536ccaf2eca5bcef43a0ebb636e87043f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b787ebb7010d21a95e8bde12b7b6346fec2a0bcf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775cbf47d2578cedf794979064ad02749efc788047bf540f521c3a49ce4a7c7d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..470ac93d32d6b34317fb846e0542adda699a414a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ea9341aba9bffa6f681f1093736ebad4afd05d3c05b620b8be2772da27a29c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97491943ab560aa4b3cbadefeab3d35ea243fe3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1a67151db411f9cb6798839d006195dea9801806861f2cc54103f34f88589f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db25b648b6255bd0dccb6ccb404cb5ea27ad2a51 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4621fcc8725bab19b7808f77b1d4658b0b0bc68c0e99d9c827d4a4c3af5706 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b74c7b306ca996a201937bab6d9e1679b03dc6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5549bcd754d10a7aeeda2e3b52af7407feabaefe9130aeb3265ac6472ed119d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21735fa0ad4b4b4f733ed93d659bc7b7520accf2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ebc21f679084003b6c114b2ef03ce2f142c307ca31584cabe4e203938bf5810 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb3e706ee18a60cddb6baae182ee6defabd4ad1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a42aa206a812a84b2ebdf52434480e25d28538b88b47c23b42a99bfbe5868a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38791e564a6aa9a06adbe4ccc7ae172d55654f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1e4f8219562b3f5467a020b4ca32d561e2dc15fc0655d15aeaf21ce16b3c26 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee64ef4fe96ac95b2dab5b577bf52e9daaa96be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e145614994de6973a10ddc8b2704e72405c9fc7015630c70e5afe41606bd0353 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8426af9c5d2f5d56984603d72acb4c00f2c4f740 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:670b396b333f1d6c200c0feb371bb5e974e1e71c348d76fc2d33a771deda49d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..918814369e20d549c1176fd968e6d305ad59eadc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c4ccae87d3ccd291d042e3c3a400ceaad4d0e80d7fb737ad8b43c345fc7164 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..292e4bb8fd6df500a3b0b89cce9a1c79ef6b3044 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6feeacb77bc14153e0a9bd34f93af6c70f4bbc6ca63a431222e6181677094ca2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..534794fcc0b6a440a29caf9c5b8693a3e4c3dad4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4405ce0cadda84dc8dc88a605da65f058ca70871ef2c299fec9657a9a3adbbf7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df35930ab0e763f4ea6e88e472db3d8c15507ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:076b6469861314d58e0d4df6b51ba7cc290a311d4e8394a9b1a48fc4a8b8f530 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df31d48ccb3936f828d82e5d07b363446e80961f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb255ec4f09946e7e25294919da4e57299041831f1984d9136d4b51c6641bab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5537ee071fa2d3d33ef3ee4ddd1a6feb3ceb6b1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd9ea26f0ddb38969089e1dc9d2113d6248c957ce672d2c445b9cd3623eadd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4231d1a07008b818579ac070ed402289514cb56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05997c07bc7db977dcb1d13035b90b191a0daba4d7b25ed1408674e1296da924 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ad623d46f7d50c1af08c02ff592d45a1a921ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c793982644c776664a2e321b56f14329d629fa4765f40e0bd4fcf989a7e9bd22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b2f74afb6e5d97e5ece6683ebfb95d389dfe1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7346f6571508937cbf3e0628cddc80adaad23881b0624464e1f3682bc8f197 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da9e703c32d2e045ef776e48d067b522ed6aa4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b37a395693df68d6dab7885f44c026ca65b6f0003652366b53923c8fea41edb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71297f3207256ad7bff29397e4c6bad0dff61a9a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a9525b5fc29f58dca27d2e7ea4dbb180c67336bf1f68910a55a04277b1e8521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92470b3eadf865a1fc1568bf77f37a98b0cc3b95 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0c4cc810af68e49460fbf95728ba87b01f74aedc1ced454a3d5e313fec22c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e511236b757b77765f8830317ac7ccd9f48f503 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc2cd22fdce57ec8279ed3658e4466cf023749c6caecb81e03a74ad274db1542 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b449a2fa0260b654504ece540d832adca33502f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c8b052cf6309e3084608edd97b86fcd9a45b7195463dbb51e0751f88c07535 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8fdc369c9e3cb9bd82cfece8802acd6f2f70386 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6e32b3253fed02c4d9f5b55d50cd3c1411aedc23ba9089c02024e9f6c8fd49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57294f956e759efcdad49522a481dfe83742f94a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b501dffd343950f8951cb03eef7401b09a3b41e3c5663ef4091551ff188389 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..979a3a7996526e1dc5d050992ac8c9699a7204b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:683080e1178012dbeb4d95bfa4e06ab441c4812fe8a7129052ba28e61ae007b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..177abeed07fce35ab5e745413f5bd77f20c30cdd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bda3daa6a91477dc8de248b57d109af0bf01836c48ec6761bbfd57290d9920f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..253187d1f8a919866fa716ad3cdc8ef4833a96ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd2d2822b1202e26a540ebd6804b363a398b206733f545b0f15db4cccf8101d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f687dfae5e65bb6eea87a1f40fe0ca6abd4f34d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c21b80622ee8d899e33daff3426c7d101f0636452cddc4551db4cf60a21a138 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..464a2eea5d206d2a660353bab6ef5edf282c44c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f864ed2c59076a15a8fb0b88fa75463ff04429d07d6c551161ee38893d4904f8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9799341173772d54b809741b964b9283a2f9920 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6dfab2a3baf466a6e721bd3bd6630b7cc1d13a844b8f166b14fd0fd3715970e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40af74a3547447140c18ba8f6f5884a01d09510d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4f3d903695e943b83a9745e6bf163373e59568cb5c561d286b6d8e2b5a230b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f4214caaef7bb23dbf15745daa6c62bcef16350 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7432111742dedf69ad0d2e39fd167778541648a9fef9632f30424e3e15e773 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d70c8ffe89af88e9acd69404373e19fdca1456 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a701cc6e49c3cbf93b4c6838a5fb116416ed0e47663f9a707928dfdd8fb14e84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad4a6ebd9ce0b17fe7a3d9937921f61b5451c15 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba9fc22e20b3d1cba312a20ff71f8f02eb631d937dfefb76f1fb58f16b83955 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..988e9c78059210065df7235248494c6f27ae9e0d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d239e87bb8cfae1ae3e60eaeffe5d612984e6f1f4a6a8d625fab70884a446b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99dd6735984a391a5ad3c75c984848c8672023b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f379190ed155b36f28278ee5321e9dfbd628a79e7b6c7c974710ab652e91b89 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39de9a33c70e0ae2dacb8c4a8b7a2d15341a335b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:596fdb22e423ec125b5ca181214b707cf1ab494a7cf135dedacc07d151930bf5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..011ab4e9f986a3cb1b1fddf2a7780a28c72f7c8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:478ef60892be25c199dd58f8750c861f4b964e47d83534ec0cb8fb22214105cf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bb35a00fc2ce179ae79db2031e55f0bf095a4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46ff353221670f5b6c823890d136dd3b162a9c0fb10f52a372c7371b1864243 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53622f2523a386f22662065edcc2062f6385b485 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9984003dac8739f0b3c25180bf8aac1c8d74cf7a03e849f6745d5d6d3aed3b96 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f3fc9a1faaf8e90cc3ee9ff32418b04fcad35a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4c334c58ca5a280219d0561e0f60ba5d6785c7573d4a1eb7b59eeb58a1b70f3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b444fb18be20c6cbb251e68e13a80a73e9985764 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6dd765f0884bed8f266a8752e538b558a55708aa9fea161d69918615da3afb7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e6dfcefa4eda923a82c61d7642e7134a6e14c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e8658cfdcf6552e826584b1256a16827ac0df628ac946ac40b67fdc99a6f5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd6b73054f8d85954230c4ec8a4e02ba6342a03a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0dca1034c2a8c5a9ec0fec3203aa97100a543180e3fe68a94b557b89509dc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c1a9ecb14ea4c60681cb48795239cacfc55c2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a612f88bd59bf6e24d180d7e479bed268ded0900278be9c80c67b01f106e23e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06a6c81b5b952f7428b64114f3fc23b90f756c27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1960a05129edef00cb6cc6c1467f41a71acc8aca4c243609aead82578683778d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e7e2588be6257224f953dbbb692529671c20f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4301ffbea4a24eca5676453e6cc60a77ddc800585c5c17f6ebcc32ca927f6391 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0ac68a74443f5f36d53583d8856e29a3f2a09a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9236f4820ca4efd48b405da14311a9202bb8d1cd334613eb6eb2584cb6611b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb5d54d721fac391c63abb3e7787562f0f2f2b83 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c767652213533f524af5302159b64c296e1882745ad68d4576ea1bdeeb44c9c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10b1f467a7a20d5d8393b2fe4bdccd9cf0c4179 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40893394076cb76ddf88bc2f79d3ffeae43e2c693eba4c02107f48c28361bbd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b4765aca757217ff3dc2838fe6dd3605803cfae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b82e7f7e8f501fda4f44dca452ba8d085fa9d001023ee93584426eda4335de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dde0296a8767cff0999d49bfda1293bcff35a60 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a3c7fc8f6c4b6ed073350acfb3fd186b147b3d423d637edac6d16a048e118f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca1669a95f13a4765e4c08eb961e8b64d048fa0f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0a5e4a25edbf1a6eb790c463cdf1b2e684524d3f6df16f0c7f6b8f85f49aae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..663237040a0d997f52be0b6a6f5867b3cac15339 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747e0b0447d06902db54694ea37df3b8d3b5d252ea94a7476913a423dda1bb80 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d430f16e3e1c6e07e9d5e0fa56c5b729391741d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159cb31dd752263d26deed4c4378d4e9678c515eb0e43a11bfe05587053b9070 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec3e3031f30488f4ebfc0991901a2fe0b24b8c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3a508c46e1dbdae75f7c3872e95f9019dfb912862ccd64d645459163b7aaa6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c774744601f646b46f76c4f7f6762bfba421d068 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da795fb323bbd4d4ac75f771c0bc6611a7df9747c8e29a5de5d799b2d6e595ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9922ad2eed997f946957c777d9e06db1678bc08 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f013f8f7f37258cff53256590f62dd30c1620ce07b2c74e3e7eed84cff2df40b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d26c174050d23a0ffcf1a846052ef6ca6b2d82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073fe9a0bf2c1d3ac2d940641d85c706bfd805ab76c512454b4f37975b717934 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd5a26b0ddfa6fddc733ef8f3db2746988baa6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13256bb3da5421241f65fa0f6e126c29f3d08e519dde3bb45206f0d5176e7b2f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d323c826ec02aef2ba7f99283fc45512a66ac7d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba0c40c9c939a66d33d0f1de3e12b8e97611a63ecbedb52436e1be55beb90d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd5f86220c27464bff1dff6bb00a33b7bde1e9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64dc64c9ea3eb7329155acbcce0f2f4fd8ccbbb8d162c80e902fe22a1538e0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0409b546fc98f8aeed1994ad689ae107117e9cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91433eb8fdea730ef93222b1c58a31134a217784a74655b9c62acdc55f94c43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f36dd1cd868f24903df21f4bcc0c57727b14edb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175ef34666aa62bf6da6307cb71cca0cfdbfec9ccde739c2de5b429294790c7d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d687887ffb74058ad4b6fb8e94957bd61e0b499 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2621159849d974cdc0b2ae0a1a1f587cd8693d479525a2f93ccf3fd51d59094 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76b223c205fb60773b124083a654597f8693c7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa18f6ab09a5b115be423429d214fb3debca52725b717fb71d5ed5de45802b4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf35a1bc6f814f635f0178d72741e2f4e961e46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea0e894883305be00a32a7b74d61cf605cc5ca0619201b123887503dbfc6794 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3672caa56645469aaa679605cb06e7a8fd44b802 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4053e6c0327ed210ccff64df288805c54bd8d6eb8aeb95a4fb7e97d2696eb371 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b809f40f6f1ebf1a3ab922167bbd8b1040fd3bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1228f1db9eaebd6c7cbc2d2256e213c5550ec6eddbcf1d7a726ba6f4bdb7ccda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edda299d81b363a2fd5cfd5cf39eca2b5413341 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81993657ec9081fa537f642fea78f913d44071b35af993a49b8c52759f2dbdf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f647c5018f49cc30b1840c5260d9deb0fb8d5240 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16e808e84eb97c3b93175e126b99ec0e326f422d298864eac65e43e6e8ca697 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc4ac3390b8da44234428db3e4dd36857a54fa7b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a83692da7cf88a365f82c11ba47cb9fdbe878dd10a0f37b0af5f324c0501bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1687e8168e18332dd9d326537d72d432b2ff502b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c280fec818d6b8be88adaf54299ff8c55ddbb49f5db7809af573cc5f8e6cb4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60036e271a48361b016ef864167d6c888a552992 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9006cd8876311e61e76e0271e5afbc298ae7566a3a00e57cc3c381778c4c69aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..313ddc599279b7bd3ec4c31bca339f344a612a10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96cc4d1cfe5630c9dc3420d5abe2f17dc6f5a56142a358fb1f19c26f2591d650 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91561d530ec03821b9fd3a252e9219b0d863a23e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f70677022b38bcc972eb605bf3ced4b96cc2c40415ea095e27833fbece289d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad37d2cedb448c5b12925e080ace89716b9b762 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c659dda61cffb0859451e59ddfdc36d6e935a052749b87ddc746e54e3f6193 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eeeaa692eec3616f0a3ddefdc7e06c9b30dc2aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1b3fb8d1223ee967c1941a31b3cee3c44b7ac0c7aac6de76f5cf4afb6e3d28 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc112608cd3bd8b0c21fdc69a09efeac8f5d1bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbdbe59a34a969705aa31704f96d69fe587d65779a179cf50adb2251331c4a8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..887805623063a0cc12ae7d6cf84c79a5bb682a15 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c195eb1d1040ca79824a4c221c6383a6d075f0fafa313dbd044d8c62838ccbea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b5fc83023d5e22f9b3dfe8d4a92c7bafcc7d74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699efa472cba94d159458c998fb8fe50917735b8835b217e76ea200a1712305d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c207981b4ec33f9ff08b20069d23d012d2b0bc88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb03cf0efe8c2a25cb2124fb89defc99d694eb1e31db4a4aa26026b5beabdf3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40a60d2cd001065915285c0ef1022df1944531c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b158dc98c872e61d31df368aea17f4b193de8363a57aa4a52f8882af1def388 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e343b21503980a1706a4af4376406f3f632ea9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b0b7dabfee768cedbc50015a4dd7c44a1b884cde37639170ba91a0e3e1dbfb1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cc771c3147d07bd36f88dd3507529a1eab8c85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20884e374bd0d8f3f193d5ab648603e39fed7a8639cae8339592a6e79968e40 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3342216c0e4b89df186554cf6cf9f22d64b03d54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe341ff8b6abde225837d86816749e319fa4e1b4cb05484f215aee4d0a75717 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50cf27ce741e96a1857404bae2e30364b8bda089 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ec7da2ac971a872e4c25c52d137d48ce97ee94bf81468024a6fa877ddafba6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..454f5706a38a16a8467e313d9d957ebc2758e492 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca40ba47940b62697f33aa044ec0faaf0b71ce0f309d55fa8ff2c3ef300cb280 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7ebdf8e39362532921c37e11e105e7cfc31a29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376b4c398ea0093beacb5e858e00639936a26f1153326b1d07e38922c8b17fc2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e9c4c3bd1390f925c129efa5b0dc2dddb5ecd8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1818a5e788df81eb2acd0b5041a90ca75914d2bed08acc2f3b9f57e310ca9601 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a947ae93ca374be6aa887c7528f5a8518f70faf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929fe57d0522e6bd94ab931342f82c7e76debf5f256e96fb116fe4c6ad9cd8a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9308f9460aff2029170f811e755899c799289a35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9195cd2188e165fac64e80606aa58e301a0d935c519ffa3b188a87eff5759cd6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a15231dd44e023881d56e048626d6c88ade47d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56002cdab9253ae4cb8ed68b4ba9f4eb91430074dc704bdfa7c29ff18af7737c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ff8214ea03e8980de94e99ee2dff3a18297030 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ba9225176bad458ae79f14ea8442fa8b71b4de5fe01ae98221eb7cc55bb37a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da925626793fc8f17c3145a75bd646e425aecdab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5cf6ab1a32a5dca9ff1e38ce1643cece787c3fe45bbcbf25e4695f7e18a4af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a19bf9acafecc28c6b002fd3aad0735f21d3040 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abcfd10e72c2bc0e97539212608eabaa7a53907256c4f25b47caa9e6f30ef85 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c48067ead5b799b45f80951fb04665b829d657f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa280ad219df5919620c15f282785b5ff94f0db0e7313619720ecec6db84cb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27a5887e05a914eb9a7a36ee34adacdef0e773dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce955d58ffc9f3251e9923552ec766e8f22088563fed70f576bc54d80563873 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5046484bceac5c68d4b7264569fb3179391793d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1846641518d52fe5900404eff081e8443c4e191507c2948f2070d71f8bdbcb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe1008f44d887402cf68759d085869bf2f2e41e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e51b2208fe8a749f4184c16a69d1c949b3fa636fec6ecca9dfce2c89cf52ad3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c355d7b598a6bcf99007d6ac18b8f05c021bfcc8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d42ab628a6b6b2936164008b760c162f586313140d62496ef41e380b9f349d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcfca7b74ab6ca49ddeb62a2a37c9b427d97555 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4402428132db4cc6e2bf46f075d1171b51b45e02ed037d5347cf7e2ef5c57af +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e06121345c6a8d47ac2a7e502c5a13691d1bdf7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d66fb6f3e18ca8dba24277e9ca971af0b9d6a89ff77826fd51e2769e156063 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1efddb214e6c05bde19764b9d9300c6ac023c3b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad7ed9879b437c6354b88605ba4bc1a990e3ad180beef53cad9f4f0df87aa43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51319769dc7cfb52ea71d8f1b6005991156b495 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36806091dd2592df22e38fb8917b9bd7484fb6dafeda6b3b82f4722d0fee6c54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5de31a22ea5fe8134a56e3af60c93dfca24e0586 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6dff7605939155baaa48f7a335007fa1c2b19cd9f5b9eef85bc06228263fed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55716f8ec4c637b2bbdfc5c94fcf96ab7d5c85ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122c074c41208d2d07372819a9b8261f34d854a8f394ded2fce146014e7ed862 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e724a58dcf437e1ddc7870de03ce92c0cca95c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d015e39aa75da0c298b2ac0d2a27eeb5005789451c755cd7a7184c60320c1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69fc4a4675f589bf7387b8c86cfd670970b62e8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560f45b3ee455de91a45aeca5e4a0e25fee03b62ce4d6596846c61c5e5307dab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5e3ff1b699bb12fca3df3a4c25c84b98dcf6b4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ffeea2dabc8b62c2a4ac3825ef4a29f355a22b940cc36ac618bc7e6073d18d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e16738c37970d869ce55a8a7afa5462a7c7951f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646e00c213b113afcaba80795d57c36969cd485e15d35e551a5eae04866fca3d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3499b6faf3933128a600d0d73c07d4158d89d7fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f9d07b59ec9dfc2616612552b323826a5fd60bd5a68cc40af4f7414c6fa1b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffcc80504b2a8c2382580028a78294bf11253bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a7a96655e1866ca27e8083357ae1a7c48bf7c253cf08e272c0818a84dbbce2 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..988dac5d205087effe5cb582467eb3430c857e92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9b776a555ffdccf38a18c643f60775610386a0c5df4ff12e3172dc2aeeb2e7 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b56795ef44965c093a70484a58f042f08a6060a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aeacabeea574f4cc3f09e9840ae2e801f7195777895ce9458311d17a2f4d933 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..843a3b9c52a07e15dc088bb937b71ce6ec8ec195 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0438cdab8c44357b6186efb440c51077af505d29a6dc7b5895fd3f3ba9f27c53 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5b746cbb895795a135d8103a4fae0958683c9a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9839a80b252eed2841a82a2d17bdb08e2aff0691aa87669dcfc7123e5ed44224 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50026c58b9a849f79c183c932ebbc26ac47cdd0b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6e41f81562efbf658be44d1b85c079d2b02f19a08a5a3473ad850f6000d419 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5007cc3ac4203d44d8bda20ea6dd686acfdea213 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8126beeb659ba5c91ea920bea1b66b714657120546f6a96195650c6245c0c0b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f61b93f2c69904a53511a4d87f80476c0a307de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0439ec0dc8c8bb1edcb5d688579af81b83f1849209e4a45872b027a085d76218 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd36846f68791f530318f85edcbd00ddb68d54f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd6e4eec46c55d8f57ab770a198a5654ed35ffe80007e9983b8b303a80cac80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b8b34c4d2c46d1844e62cfd48f36be97aee9c2c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65c7f36d9e1d6c5af9139ad08e2ced3218aa01b79304cd686f8aba55fb1be81c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdebd537f0872e8ab1b91360533bb95d6fe08101 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb75d96ff2fbd4a4059d31044e4fe6eb0a897532d6d784ff8a05933470962ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc3e34418fc8a9027a5803257045cacaaaec97b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a526b343bc64d49fca1298e7b08bc58ccbeb1669c48c3537b2c92c8d249865e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecc369d23eae258d07c819e837fc1fcfedafbd4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9564f5f055fcba1a48e2826d5b01b094e3622e6bed59076cd8f6e285afa19f14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8b19e21bedb37893fcbf5d730a78e063bfd17cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00992dca2071978f51f8ecabaa4df2b6448a0d8c73ef959a667dbd6611e29197 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e9df68862137dd3c08f3c46690c0f75ffbe4a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ade70013266b198989c62e7c3683a8896e43e1b0f3eb37b7270bd6189f5040 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f6b73c8f29c2e1875db325442ae85ed3e4ea795 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03517398c07d8eab4e9deaa8a97cc2aa39c8a0257e903b7a7a3cb291ffc73cd2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0421606263637bfdd86abd0903d2d212700d9c6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291244753b7d77ab38f0f93d59e045c1869b2b0edb1d0d640b92f775171ee21b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fbd0070fcfda7cbf30885cb0f9522661c3e896 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ccd9fb688c79e21ec84019d9a14cf28118dbfa49bd6b52e11f3d888845f029 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52b223e4ece81cf6dc1eb9dda985687538613560 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9499e5f6c8fdab0ade30d9c1939db4b0b867bb8ae691b4c3b43101db8b6b981 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecab2287794a71bb503fb1c7a7d0b3f8d294a17e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f63a1e6c8e3d46ffb1fff193f633939c1b13420eb1f0910420d729faae57c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4fb5fb87581b480ad40122ec6dbcdf804a67f80 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a75cbd8c2fe64c3445c3dd864a100fdb63685a757655cdfb41516c28679ddd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76888da013abf8b578c90c2c6240da083039ce0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f7334b5b5d0955f6473661ac30430aa46eb81f33a80a47f42855b313c7990d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1103c106ab9f1954f160dd50fd4f456c74f07e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a80c65327c625642d035e8206bc9ca64e864c028d8b4a3406e8669b03c7215 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e726305b8bd927c0475fea7892ade384156756c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9032838dfd1d86d06f2c7e1191fef678519708daaae4ba518dc5fdc3751f7020 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f648ec63f72859eae6cf249ca1bdf6b2459af643 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be739be2bc000e184df0c1906f2d27fde498622c58588e4f530aa1136b9ef0cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9ab1ff5ea385e9a67f01292f7f87c69ad012562 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7063c02dda3e0eec95f6605cf9eb333a821436b1d7a92fd87d5de24d4685059 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c14a937779f851f206d41fe29765e85d4bb0fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9bcb6bcb600ffb07110a26456f23e9072bd867d488cf62cd3e265d161c7c3a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a7ea8a99d95b119fabb1b67d7d4238acc4783cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1e02c7237cc6ea0bef6f28cf66aa6da2f118e61b3295a68b9c526d28766d2e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78441a6597e0dab69466daeed33a5293b1f84a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3e7eb322a43ae2b6315786610c817f0f41c6852b1b7fc363aa037415972584 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19d769db166c624ffbf17d6626aeb87b881ff2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26560d5e3301e3987452b498197562afce9cb6802fa7a2c3e2022df579851ad2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed242571b1fefaa3cdb4986a5bca9b4cf6f544d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f2e6efa120d0f1f64f94c75254890788d379e8ffcaee39bd20d67cc73d476b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01295128ac9c9b71a0d5da3bb361c245bd94328d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34057aa874e5b5419c389549c3ff3aea5b8b21f41b1ba8e00025ddc40831a20 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b26d1cf15af869e1104398eca8f51673dbe6678 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c18f7876c22f60318189c7d638560626d4ffe048ecf33ae1c889aa4468560 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a8687078d19504396abe811d442ea3ed47c927 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a28deb40e46214cd8f6d13c2b65b00ccbf03608c3e6f38ca2171b7d4d0de440 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f64b04ec94adbad70f964b83b655e334be414741 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049ca7738f944df051e00cf484a6f96e0df55359e5435b2a70a8b2ab2b044842 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25f874a580722ef4ddb6120a9ad1ca6a615cb822 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dccc4f474316f84f2fff81d5d09afcda04196e48de5096e5fc64081d3b301851 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f0bdfdf7891c761fa6e2706fed2d49b8e84e52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb5154de17cad2e2cf74e8e2def524bab84db099d4df1c9ba055c1f67e0d2f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9430a8497f7c3a342bef7526deca4fcb9f40d408 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a74ad8435afe0756834360e14eeffbd4e68b43defa8d92b08f35391bba96c2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bba7b05cc1f44a9c30a5eaf818943bf0850ef31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e44b79ee2b542b5f233c6cee0cb92915aab5337ea93e338bb57caa3c1638e03 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a746276203119c791f6c72a803e3a4674be9bbb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3feb125843191a9005eaabf98b0d137ff05d8b7a986cb8d7ce333905b96697bb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52521906d041dcc80ae00f6e83d0f6d0ff135b24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6e4375255e00d6deddeba01225b23173c4226880309b4716baa58f71c57117 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf84fb9fdd3040240a7fbad552ba1094510bd24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1992390e3038dc78caeaff0f55e187b94395a633867df498f5990555096fc7f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae774dd9a8c6536c5e53e2d69ddb5426361c42d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e93b368bf17750f5a261d079bcbb1fb1b271cd23caf6284d9dd85c76a98aaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d8fc96b94b2a698a01b80402a062d5f86581cbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5167e0ba431da78662fb1d4198261ec3cafdecd46037fd95ed9126fa95a806d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b31bd99af4800849299d9946ffbc21eb7526bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df978fddc485faa40f955dcf967b776bc1c8364b458a3761b9f9173dacce708a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad8087afbf4c358ff7145d51be01b4c80f79c1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc8f21b315750ea869f026b11b36e7af1f57a4368626b03be182f4ef0b44bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bb79ac8e46e0914457c003be586d1c3f5b30bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b020b4450fb788ad45b3c0040b7b6cab31513d3960950158bb239cac4914a836 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7451bb8fe699fa7654fb8f1236a47e55fe6f60da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df8ad234bf7d2356eb7daeaa742e674e09cd92b229ada0ccd24ce9706b3f174 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c960d060abeaf7ce97448e3516efa05e71a8d739 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751687fab42425b2bea245f8a8671525106af756e938ee7b0ae4efa1a4f96548 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb8163ef2f7e7ad5bbf06119070b68623cf5e79 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db436265b25198d02bc6c273edc91070baeedcfa4364512ea2d4f3bab06d606b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79be80bb0f62eb3ed74d881582f0dc9b2db8b2d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f5560154c52ef171b61d3ee6dd69828383eb2bdc204ea34ba5b4ea8333ae22 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ad9b41fd720843831e443aabf001cefab1a731 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780cbfdc6db6c438cfb74787277ffd17aa8da7670a5778b93bc8ca248b68109c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50fa609215d96a264bee61dec117f91e456f8972 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbf6ec73fb95d09df890203db1fc0c7045e7e78292d27927f5828a1843dcb2a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6f62b63f350c21356ae555008d67d3898a5a54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59741c9b791c92427d378e41771072a6125c399fd59aaf8671d27758b994d704 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c962ea5b5843ad46e86845e5efc9faeb74d7a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff766c7860363db3345488140cc19f504f100be87fc100a0ce4163cf76753ed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ad7322308b9f5c78e945407724b6f68d7b51707 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25101798dfd59fad6b557854edff6474fcdd5af6f714b1bd643d85b5d5939e45 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..725724f24f20d8c41f09c0227d65d5dcde846eb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae6c94c080b16a0f48c356648b3605c0fa0ff6bfc5b174612814d91ddd382ea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11082af1f21a60a0cf183aab59027a913dcef4b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0c82b1a3d5fe2d2b18652debb52f3abcc4cee64317715d0d0248414b1f75e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e543143c69db97f67b1f37f6b797a65fed2f2d65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e183270f9a8364e6a39279ddd2566eb1ecc07ec8591d6bd7af885c646aa1ce9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49bb242497f6d8b30e834543f06d8b6dee0c85ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f2201b05f16f087a1ee73438dac29acc272bd3b985812ead626ef4819f6478 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2c58b06b4360a7fab58ea5de32a3c67b186ace --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b13557d760a92317a352afef5d1f207bbeba519259a0459a702bdab02070d9e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cdcd15d9a1bd5dabee3b4d38bfcf7345d91fe4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f641b00ff253f5360c14dc5f9725581ad4ca92b8a777b4561ab08e58603ae3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d3d9d91645a9356d143e8da1f865bb99585aa51 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bb46b3cd22648deff2d27ccb00c8d2facbd0ee6538b630258e656e4d6efe28 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93fff08c058073ccb62bb097939a90c3827cdaa1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78013711ee3348b24c7e0d53cd699492e226a9557a86dceb5be1615a559afaf5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a80d9cf7b031f9948ea122c265e9b37eeb739d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6883888cbe7762f7bf2456e1ef4bd576995c409a44a8160c497a4c9ef13edba0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a01e11c8594bb67f3b6ad985b7c911153ba9a29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6db691fd43bcb1b22a3cca5b3c7c1d00ba8c3f28afb536f909a1f8d76027f80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c9f2f45a2f3fb85d0bf7d7cbf656ff3baaab98b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec49e38d0626dfaa780ea4945d79654c7ea39e701f0b7cb3c7dc2b03f8484c61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde4451d0e027ac2f1b7cd87708e2fc64173628e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2e50a76b771fefeeb2fc935f68a464d66361fcf18dea4c4638f91c8b286dd9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2496ad7985a64f67e52e3d77e5012ed6d7161b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ce064f3a0dcfc67afa916f18486e88899de923ddcbae29838100a9259b2e5bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba8fb01c01f007373d38ab444ed4396a0996900 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a7b0d014ab26237367ec2176a71ef0665c5de40d68ff0097774f16d66056b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bda96c0b5f755f01c7f08c0b96060b62f4e4b8f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d88ad6a9edae88c03bf8b8548b164cd2a7d3e5248f8f805dda59b6ad4796cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eabd91819cb4b5cff415da9ec559fe2d1715cf88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1118bf13353481d8a89468e09853a9cec3d6aa59ccac88aee941251ea86cc1b0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9650197a6b27234ec42c0d9ac44724359395069 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7d54e92810866ac9019352d79419a6681ee75c8fb379b3d66c2740837fe0c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d073e3195d04865b46b1c2320eda5fbbefd64f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae9eae3ec0a52470443673996d1e075d96419e091f0ccb15c8f5c8b5ba6ccf5a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f4d94eb442241922ae510f6caf65d9328a0aa9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fb7b6555eac4cad3cd91a9f2d28d72e859f6bbd8ee1a3e700fbc1b55701e8a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddcbec2d6dad55f24479bb77fd227399109ec577 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7311dd0063edae7fe935afb7848a39b7388b4be4a504636592ca6e4513862977 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46275a0f003fc732a0ccdff3685f5a29cd66cc23 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1adff4177f51e5f28d2021e3364b2830469fe3a8122358af55e469d5f01f3067 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3796f321c3957855c14a8360ce151f67a2e8adcf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:552845132945995eaa6dd2dfd112cba10eb6e2e2ab454d34425bc61ff641fc1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa098a0accd632e032c8576197c0a1b7589f5991 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1f1758b38c5872a75a60c20de341261adf161f35b33c688b3d9f14dc508ae4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..954de5722de95fedfbb117c72a6acd66e945d29a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45fb8e0a8f06c92ab0e2df1961140aedbdd547a3ef6de1e4f22ef2ae4084652 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0131db10449661f87b57a2594e485164359e07f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830abea3d751f0467ce4205ec07cc434afa1d60fb2d706817352028835d01dc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c7374598a6914fbf5d28e6f0a65da3bf77f5be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd78590ca4ac2a874a2f019877017f5133826b395f840b03435068690edbeaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9b558fedc7f9d091f5327878aaaf6d3e311abe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0f98824f6d8adcc9059364a9af9cc62be0f14078ba049fbb8cf6f4368e2304 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5df377baf08a6947a57f39b9fb769484b13d18e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f02c8f13acbbd848441e5298a2a5ce93afd1461531c743109ac41d1bca5e15a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ec02cd5405c7c16e70339848b9a86d6900ee44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52e2231237e6600809647703291e457d10e60d1bc040946944415d6cfa1d873 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2adfb2dca75f1ee2fb47d86061b70acbdce30a39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e9a6b89febd3b31b54d6fab0f1826010a869e8e0c334eb95228d5fb6e7a5faa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5935deeca256cf387f4812e13b6a51fe18d72ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138b2bb13fd000b587b6a2989272ab66a28ce92e42ab1ac25bf5f3421806feed +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbfaf4a0401ddbd7678b54b8610677cb158365f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39efe56c07b119e6bfbe7c937d245ee17ec39339ae9acb0c2b46afeee5966bf1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e26bd0531939d97a806ac8c193ad627496e666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad646c0b7623a7ece9f3d65fff4506f99ceeb70222aa242fbe530f6e8de22772 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69665038f9130735ae8974fb4fc8f4880c787fc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b893b239c23c2d4858a07b99d483c2c0046811527e44be368206a3743620a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c038320bf0941e0ed00eb8276704afbf13d568e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cda2f2c7451d62ac5a91f411324069a2843f72d76d390c2e61dc80a52f4247b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd11ba457f902df386e57bfdc03f733b65fe4237 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62212a8f1ea73a1fcdb256d7d492a176dae50515c424b0cbb158c9cd486823d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46c28b673e2a090e58f6a16f8a639ff468db8cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64acf712f8a5cbe7d130e78a062aaa58967a4a953efa08d1641da820ff654b01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ebe13e2f292b4f90421219b183b86a1e7a3741 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e6d60e1cd8e368aec1088daea1d99bd78be7f9e08bbd7efb42ffba96656c7c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a5fb58248bc5b0de9b94f25adb97f477b30e0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922c7c4ba99a0a240787389de55355de1b7e87679fdb33d1f2eca70cefce1604 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1efaa09ecca7a3ba3724bc1b398a3ce52b1be6f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e30db5668ac4b639dceae5b63a20e55029f166a5e465c92431048245a102a18 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8609b4cd95b42ad1f105e234aa824cd2937431 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d7ad61c2d9a4a1f851d3401606837f19c2868ae46c832f365566425a13bf13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cadf0e0cefbf33c6e12c0dc2b4ab529fc98f01b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d2f3dfc3b026ae3f6db75bc6f47ebe0cc48469aa19042c134cfb9e86220af69 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3c5239316e66370a9037368f7bd11accebb4f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c28492859902961e194c2ac17a4d4be89b862cce35ba369ffe48e4f1895d7c4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa7354ae9588bef07ad75fce20cc87dc1a4ee6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbc5431d43785754eb6250710e63bf094419d51558ad045344c81d91cacbb61 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..438dfa52ebed9c6389837972f7bcbe269ccc151d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51623d469bcef7ea1108709cec39824a0d9084e3a345c66069e712631830ec7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb5283dfccbd6a7efa7e6eda04d63103894ff51a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671c292fb0bb36d57194fabd792d1c97ccf0779ca6cf901f805457c33eb42dd2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..847f583079089a9da2c36f84be20f45e165bf763 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9810647bdfd67fe6f88e69378d979152d114de938298b63bf3537788114eaac1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9fe6ab63f084f0ffa3a4e824b51e2ad6fa576b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4823799828370b734e044275a62086939cba08233b9d7c3b160bcd8d23f1d793 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc435743d1d1b8de146e245f2fece44f94c4be27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce39526171aca0f8afbf249cf5790bf9da0d7d667ffac0f7b14d765ced81c1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c0fd792e04bfceecbe2e07802a004053fef699b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d827de2d0856d6aa9200163668924a93b51fef55d6a5718ce924c9b976e6c7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24008a87403b843910fcf2b38166163c55200c9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2d7130d13ce3724d126bfdade4d13cbbb8adb7d8ec807febff4b7cba824240 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..184c82001fedc9abc34d63534f4eb677393b1e81 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55004bd34312238afea077a391f5fc71356d038f558377a275d671512eaf79a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05dd483b9e32eb76b081bba8915331b97dd1acf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24bab3434dbce17124bc33da712bb8c6c44977b472ebb9a058f4a73b8b7fd379 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4227b0377477fcdeedbabc25b7da8459fa207ed3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3350a3438c05d25cbfe2eb368a6111ad39f2d683b1efb170345a4a58b25a05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d49cfcf24444f3a6a9dca80d8597f1e12c0da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa0c03f647dc6d3d65bf5c189c0ce2cc2990c415279a6b69d74b4c8cb24395e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db36225eeff6ba6682a210f3adcee60ba49a5af1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64c0851121123a5b2d0cd03bf8630bfa8ff77078c86fadceb0a72f5b48c7825 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f947b484e8de7998895a8448f29089f2fbe2aa2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f11490ae465ed2b3d4e1f42cd5de3aa05d2b7cb0f6dddefb55e5d191a123b10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6db8e6ee4cba85e1a447dd866a101c05dee1ddc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152cb9588cf99b396dc370c22ebb2541d2bd7451f03f96c1da0bf813c73a0b1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3835bfeb9c907670371f0f77d9378f9b5526b531 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc2da5f2ed9c765c908315ac54e92656937c48a77b83da86156e1dc2edf7b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..715ab1627e920a06d95810696758a031dd880910 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb703ddf73528a9f8d2b7bf45854cbf5588e5c543dbfa49fa78f455b94879e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe1c489bda38d73e7acd0f9272f0a313d46becc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8babe7f16f2d8cb5aa812460f9a26fbfa513982e5a5091e7eb0a6ea3daeeb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30a0825ac913c58a11d2296becc45277db6ec74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b8c2dcb7809e2791d79c936f46d7ddca8e1d30272eff3dfa7aa14b89673851 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc6bec36d49d8bcc45a7b23120fd50beed88389 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdffdb9fc9e0f59458b925127d9918a8ef7385b5173dcb01a79b5203a62e40bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7997d36501224395cf9d53b5f7863ba2274d5d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57e7c73b5380ef7a5a071b205c716e526f4245e803b484623e61563b641724e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9323cfd9113f73950ae54a3adaec1d551cfd02d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afe062f8985582748c444d44a28437e848d420f3180c219cc1bbafb03db3ca4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2399e39ab3ceba2db9c6d26d31286876d440dcc6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007b1ccf07249c571a0f0bfb60833991dd8fb94b276f1bde714162598b03c287 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ccfdd8d1168db86754858df7d0486b9f058e1af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f48804560f5b83ed3946bc5ac57b9ba196f884c0c76142a83256e82013050f9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..428402c480570525ee7a6fa7e9bc519552e691f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3812d589580ffc3ee2f2c9ce09226f2ebcd8ef2312eadc1b359c719499bf29a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7454e3e7e58356987cedfb6d425a539731c58221 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0476cf6671e6456d88d7db52d0f20ab5818fcb17af450460fd65f91665d65f3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b357e12cb03f14eb7ed665f2a8bc04258ae8d7ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9433628d5d6035bf1483698c601f766451669cc988022d5f6537f75e0bd5a4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad5c13863885d61921a6087f4180b4a9dc5a06a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9952083ce9a7a613d1260ba47bc99c3085a4700b70aa5adf062b35fb466420 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb3baccb00cdb4f5f1430e0197c960eac87246b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c23f378a3d60121a9bebf35b50f21f004770f2f9f5fc505f4e76d6c640b24d3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fe5fa84c7b02981f422d9aa5a6508ef4095b16 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59502293417a9a9c5f997d4dae11f290a5e2671f40ce6e6cdd3671fa9ebc22f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a82109e02d7bc0bb029440e9f1e29743a3a9ccf9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb97a9ecde081b49c55f39afea09e1c375c61bc253a996fb51a3fb36287b297 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0611987013bece1404980b38ee0051feb0c5bc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30af1473434e859dbba6200766e0f1935814160c55c9ee1c9af00bbd35634e39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c691f67ecf1f0d5b299e7049eb6e8c7e2e98b33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4991f09f2e61897b83597c8adbd0edf71ed23839c67d3dc2b1f6f9334955a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03479189f67396fed16c98f5142168767208d6ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:375f3ca7f50837fa2f2554faf1b97c71762551410cd3f369a8049163154907ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4058488930fcb1e70dc1e65e42d8951870cd789f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78357cf5356a6a9eda6a3714a88a0a5fa5a022309bcc158ae6fbf92aef7643c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d38cf3faf7dbd9629989a00ff6acc4cf380730 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4379d9dab4d1be052c540dcfa54c6211cbc10a11f5d10810fa2ad6729e766e8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18d9c84242095718a075aea0cde3c1023e7fd24c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e2095990a5b57514dcf07b25c6afa5e9c8a3930bfd4b5b74cbb4e83612d064d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7702ed107354deeb10247364cb99f8384162b70d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f2757cfbec9398b82ba759948128eb3e7f33d1ff8cd690857276f40f926a93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac1bbece1b8c8da277ce3d6d4145ba6e373b06c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adfafb942cfd07fb625457f90a38223b069bb725e06f721988f7195c0c47f771 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c43e3f1cae3db56fb26f808a7544c600fbc39e12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34270dee1cb539cc066ef59be7168c3317ec9b718d3251228335ab9390eb6a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ba237fe3acbfdec762f52cc2c1eb27739bed9c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eaa4bcb438329027f4605ae37d51feb1179575bd375a2e649dde6e26961e916 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa149f5e893005df87caed6611b30224a425f1b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b86fef4e1f6e4db2cbf61e5b8c9ca0828899c8cac05db6c8db85687518c48cba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f93d7df38c9284a24124873f29ff1a24d62764 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5207981eb439b6d55fdbcd070884fb21736d136a5cc1faa09ff6cb8cebfa963a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4228e057fe7b5e327b2e3fd34fde493455b7c28a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b944da4c3370c9b1c4c8abc5a15e252f10f28aa156f35f0011ade1d10a5b7684 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22646adf023fcc904cb100925fde2cc6ec6bffe5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac52128ae76919f0d9c21d55d1fa0f3203de4130b86dcd9d7cbd3556bcb0f891 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0632b3a0e4081fc1cbd2a150cc4f7afc6893a20 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9368b95dc6f83f203bcc9782d12e849f3eca5ac393cc101f4186d1047903163 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d9f1d5ab65f6ecf66acc4863a9c1017915938d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049dd0699e0d84cbb5912b925a585927b76e183056402fe6070119fb5e22c729 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d573b296c97bcc89b8e725c7eec6d58d0a6a442b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69517ef9b12c59908e77c2fd2685d986c3d3b53020482c95401f19c777a932f9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ee619fa2493d523a96a7dc6da0ac0461abc432 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305e8cc709379e9483c22f8e4287aa811f8e33639e522309cc5b3aaaa8791b0e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9b21fc9e5d36e13f7f60b5608c5e25739e6884 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e884a2e00d26a7c0a18f04aa32e2c04cdcea22afcdca0d01460253412bbc18de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f0c38f855a6f17e080e87a2887dfd67e1a10e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d631a93f440b203b74f3713ba12699253d536c8a14eff5e1be8d39a0045dd11 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b523092c8861225a45e8caa0f6f302ef298feee5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfa798bf47042956ddaa19a68d3ffb08e03792e8e0edfe09956637afc3bf98e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..367f1077680550a722832a9dd8cb3a5cb841b193 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af6c124c07b1ee8686ecd5c42e324d3cad8feb54ec1c360b848e16567568d0a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ccf189b4ce43576a1b42c238bef593701452907 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d2ba57b910019ffa991ccdb4973a95d416da9d0c389e4f2458d7ff731c728e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af805eb75b409f0284429919887d405f95c0d528 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a2ceb2da9a18a39f5d4373a57bf1f0e94d1c880fde5f37d1ee9bf165d8d7cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ab9f9c999ba384a4017ccac3b78da816e6a3d36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce71f2ec0b76d6c91ab17f0a99badb2572cd689a3bcc0b0c3254d6376154aa77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1073e8a7fdb68f20ffbc780fccb1ea2be04c0d35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba97b9c70e4deec4dc9db825c68913068956171b17375acd677dc930b8fd781d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c518b4deda97455d514ab1c66051221b2e6d3ff9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b2a6a740a58658587b07bdff8a3b291e4eabccbcdd11bf14649ec3d0242cd7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f529d45dc6c3a12ca965451aa14067e3668fdadc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08dbb7f798222d48cac08509cc8529f870b53873f42fc4cac129623b2d3d4f31 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d60659164c966d601dcf37dd2f4ec3af7c651a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd7ec34f1b4cc6761e1dde21dd4be3fb348c54cb3bac364ebcc1c7af124e143 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e254149bb9914d707e869b53cfc36542f5d511 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45dc9b1e2fd54ad7fce31316f98947cc1494a36ce01fa9e54a6818e1cf66e9dc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f0a9a718bd8277100b6ed63b092ce7dcd78597 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa07e5dfdbae6548216c224b6df61bdc1c0c30aa525c93b3b723ca9ad3ae311 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ed6997d176e2db7ac1a4b5f286443c0461536a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d598c46e13d69e134da33a78379a03725f1f701d327647dccfed28afa65467 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a3bc483fe3b524c63e62a27beac9849ed946d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66de49ec74e566dab789a3076293d03f78289f030b54b0f089ad41d11127a341 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30cc11901a1e6d76176ca8208b4d6105fb028ef5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228b389213f39fe9ecb051c8d1f420d09f3c36f89840daeb5bb1150e743ece16 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85605116975f818f02dce4b92e3e6e6489845cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd719b2841f44033aefe3a540e6df6f31c3ba14501ab022d291179b9894a21a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a19004c26a3fc6e97226e577c9a0bc35ea9508 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994799b699c7d524b2fb8c90f960c51bc01c2e7718b4ac7033c067ac61668256 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1d4f3eb783e56af9caae6e7bcc6f8c236484b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e723938401226ec78d64d30f0a3acd0f0214aa5acee160b7acd04705a6d82cc0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..351f3bef33820531f86f6e3b1e43b37684ab016d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0567cbaeec6e7c0f85cc301e76683b9bcfb94310af6ac6ef2d74265805e6bb61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f08cfcb9e16478d7ef6e2b66b7253e4d90b8808 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:347dc0993b0108170032f7d32210b6c9b27f38735e3659fd9d98456e29a48586 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c73305ae1826196aff17e5a5618467de251ef888 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f33be04a667512502541a6ba5373016b5f87dfbd653393da3671d84d078ef9c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41ef762645faf46c88ebb6d6f6e95d6fd47275aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93f47ae532a1967f474b2b6a6c8bea9ef550ae0f59350842ace50a7b6e384b8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fb1f523b105bd47c81818a80dc881c15b926f8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62a2e6f54d72e54f68edb241cde602ba37df563b7e2bd75ca90c003a17005bc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e85a7d68c12cd50e9915669957470a093e3dcc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24ecea5e2d765c91221d8ac64e47492f6b2e22b699a4cbb20c4eef2b1b1f481 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe1fbd1660271a5d5294945c4dacf21cf631894d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bacc27168ab85676dcf77c7eb42ee5062662d705de111f93d1da88dfb40cefff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72c395f85e28c69ac8a3f7bf6e5fd81e1f29589 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd8f2a63fe48f97b826b3bc6408d35089eea9b6d6ec4897162ae42a39ceeeb9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8d413b4af68ca449efb66753a109a79786ddf9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538d98473e7674da8702688b85801c3483cb4a170f7c223a96e28fd4b5dde395 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b4a78f8eb03a34db37b8c5acd583b651a105de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef44b979fea4200d56271d158203cb77d89747c5ae744f7c2b36f66454a2ede +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23461132a01a2fcf1ec5c5eac5e527c1be29b942 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4360e38413fe3d7cfe8caa6bc6aee669e71e3a13ae99c6853fa2d8f8b602983 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d736d139cdcadedcd029a3514ddaa39aa7ed2b26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9148c18e62297b4d537b4f6ff2597c261ce094da38bdfc1e1e9348d5199208b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3d3e92138dc83a718a5a5c065b2ff1dfe1129b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de152e85e831d103ca1be7c3aae96bbcfdb7e1d93764de8a8295d33709edc4e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaecbdd1fe6bc9ad8e4d1b1d5c773229ad845f21 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd5d869a5a968596ff98596525ccd4af6ad0c4ed5583d95aeb60248f9d93e75 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec88ecbd9e54dfa1297465c00cd57d195e9edfd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d9eafef2df76a5ce03f40e9e0541554c99efeb4d0df86051869f3190c95df8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1153c791afc538598bc323bf72e9055eeffa49 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03eff7b06f848e451e269728e02fbd76cc7b0df7823a6b7fcb0b7919dafe81ca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b275d4c7f510b15d859584ca2b6c6fd179ceb5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933ae63bc5c2881cdcf8db9f976362c6503230ef5fbafc402c4e335adec2e312 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b96c09fd8e11ac14a8bcb3a44ebed1c4ee93ae7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2413058283b2d0b630c86920b941cc6658e5e792956b6877012b01340d347abd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2df3e26d17c593c9722f2914663c0978b4620d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d49716c969841a7b96f3e34221ae4271496aae12779775e6887bfcdabce342 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03836837c38a9cf59d5a6c52afea81abd5ef7489 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118966e564822d39ff4183843fe7274114c11f691d43177c5247d4244a492e08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0874b0e77fbd2862a79fc31169060093b4c860 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73e1787c0739c42d4c8c3c8d3459d9f3e08ce820d1770404502d59ceb1c060f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d104a4a0c0eeb733a2d394c455d5d25cf521173 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f282c437f21c5c46ecc98f0bea2acffa799c37cf4314f7192fd92ee86f218c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40be1f58b49c9e18773ba827200cdeedfd225a31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed66eea0ff0c36ec59e85395c96cf629c1db564a57f3154899f085da895e312 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e432185bbede3e64d93ce541bb9b74148772b04e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed17d2afe4c36af6ee59148662904dfd1136da13eb5bc40b0000b1fa090dc493 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..498abfece268d5e8dd4e6bd6b89789c595579e1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc917e35e2cdcb4c4b2f9cbd52eb778e43098b11b4d2811dbcbb23bc139e463 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77fe417e7f5d7394e570d184f113166199e3ddef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c1d872903601aeaf3435c510dbdc7779977c1c7febf13f576614bcedd26f34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3298dd9afd4a091e82a11b9431738891cc59190b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0eb6213ac387d71278952528f6d382efe05e2e3a6f4c8c030f4ebef0b3766b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed19ff07cf143f56332e578b0f18f46139a9be42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b252c1aa9c55eaea7c2fc174fe651938c0d6338286a68a18247c09a760c4f040 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb50b0c80604f9c5481ed1894f242c787299b60 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349b32d01d233a3aba8d9565a675f64c198f231842287db7b8b3cb17db99a685 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..707ddbafb6e1c6079c57c27d5ab4f4acba261842 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84583e44ced8c9779c50e53e1469a1f945c38347953147f65638401dec55e5a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ed84cdda5b7e0615e365d81a5cb55f576f0928 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c09be21cdda44de1b5c80f50c1f30de8ed4adde64cf4939bb374ea443bc5e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d0bbc7400547f7f3474eb65ee205b46f28d8d6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052d437b0e0dad7ff05710bdf926c96887801b16f3a15d5a993bc71bb3000c05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5882f4a0382ddd2be5acf5255d6957f20b9eb4bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4708b7dc4980532b3e79f9a02e387e80838161c69cfbdd3a32ad4d3dc551dc3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..caacb90bed37f1acb75759a3aee5dbd0f16ed207 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a33383bfb402442476088cd11b89175e0394fdc25c28ae14ca8fa2cabf3450b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e21ab42ccdfb5bf8b3a306adcc4c04d263b4bfc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d681a4019784d037ebb81ef22a564cedcd704428cff61b82353bf67ea8d7bec2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4087b8daded6ddd8b2ecffc74cbf66e15aa251e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d55b236f58059b03a477262288cafebeb1d85656dd317c9dcce6310c220841 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4052db10b93155a0843f3d36df0a8cc142efe0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac2f438e67af3650533eae9116092e7756012775aceff5d6375368396a8959d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9b20d592913e5fb478326b7b4c76b3f3132fe59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb432c5b0146ee427ec9e777ad558715352dc606e989ef3d1122c6d0411f226 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6be52cecd710ef7ea28a8d0bd1157846605f9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35346b3f391293df1a42a8be1aa412d47b2cc7b82b270386713611dc6b7d4626 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f2551ac3a8f22299f3b2515eec138e27c13156 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134145e95f27a30c433cb09450ff52b7f3c3faadca15145f2eb7403924275994 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb3be746e2bf36d7cc2ab075cb3f014206515bd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cfde03eec4baf61d99467cccba0fb0b0cec00685463680c991c34ffedc5a053 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb254ba516d778266e8f90fc8314ed68fd543566 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2de595695c42a73b71a155cb40d9b3f46cd871b1542eef9ecf3c701af3a685e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7855827dd932dfd2a398d2507928f1892a9ebc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d97673a134e83430951c513158e2aaddd1f3d6f06cba436905b99c67932dcf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2125a50887d4363b8eb6cd6c58c8a736efd19f29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9c6d201a69cb07eca7603b72adb12f9d10a4532e8ade761abe12ed2f337bc0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d5a069581cf8c5ac512c7c5e9328c45ffae863 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2222a51107262111b082284e8a099ab86ba04f392fb961f9e7c4a229ec36e2e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a642b280678f5c88022ccd1e3f1a217b6c3b8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e908412161d22420f38b6a6bd43df1e7c18e8fd9d97cf89f651a0716638bd6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9408313f0b6e9ad3ad99c025a62bc4640dd632 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:debca2edd025b49c723a9d5c000b7e14c538bdddff91429dda2c7c8219c9ee03 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b339dc8cc49d0f64df0cc233de4c0002958be325 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13de512a793a2ad8df12177e5b281b6b2caefd172283d0ad07c914e58cf03172 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b755fd84110742d051acf4827e508aad12fc0e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae61ea5aa3162c784f3b8a521acf4ac79ac23a89ddf3900fd4d76470b6dca6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d2fa7ce0c264e0b3639a88b68042f82ea94a6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687fe89ab811bc1f3baced3e6454cbcb23eea870d0d8a183ff0ed310c5c6895e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fcadabc620db3c99282465d13bf1eadd37c9b2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85b8f25b7593961f40f4fca738fb2ad454131322bcb2774353753ff4648a64e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf660501c264c80afa470282c3bd0c6fc6ba0613 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f7ba68689080630ca753964b21387d1573b988b54fe5e899709efecb176a51 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..130306f5bfc336ff3182a93d58484d93a8862a69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10dd6106be932a829c70b504c780eeced8c81796cca02d1a1cbf1729f4f93fff +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b539e51147831fcbf2f6065a45e77600cc4862 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb92e7ec1bb5d1f5f66469eb5ed5ce8fcb9b993665e48fda43a97c74055d9165 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9c8c2212708a344f68025911905c480e3c21d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420a0c503aaeb3273472e688f6c8413e54a65afd2c65d259508402a80534e17a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6faddc4987e0157c4ca781093a20af11ddaa47e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22124b806ee3b2981896d0ff2595920bacd6572d1ccfc1d0d6e09b8439b700f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d2742891e4542b20361aa6aacc7a59e79d79d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10752b7b2d3d77941fd51af3ea0029405702032d57b2e72470716a23f4315637 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3614c4cc519a3ae0275160b306f35de8ae2c85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c6c83e481a3bae0d24e206728be69143b0be3ff4611dec693f742edfc9e8b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d36f1296d3170d26a45fcac444f34538d7f076c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e6b0d9315cafe457163761e7cc5558b1ebc3a62ecc81bc9942004b83163f05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc1a54aaa6d74f7651020f6aeedb1cc1b338a91d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53a442a23bd3b3696f3b7191ea5d881a8681171209674d41c529f18e5aaa791 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc7b74d3c0bc81e99730164b9392ab998b0fefac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2c2297cb16bf4b89ecc7d6f1b3c4f5772a271467daf477631ca319b98f1791 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36d96c9db93161e8d2aeb5ca532966f2e79714cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f4b37ea08a1a90e80224340d5f85be8a6e7831b277ac52f2feadbdedec25aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41641c1417ca2063ac4d14f0fe651a002370e140 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ff3bb73869b7adecf9e794eaa927aa543270baf263efb758d491dcf48cff63 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..968b5315fc4d3e71c46e8da4148107e427aebdfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6064fb393f40c13a283a3a19094ce8a143c90d78dedc643a7b0cd6f6ed194922 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1e4e7e3376b6348d7e813cb7e9126e06ab23c04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc0526cfbc1ffee0982dcf8be428e46fcca3d959368f6c50efa9f715f42ab76 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e671dde993c976d2130ba51a0295f6ca7e87efc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42854c4c5468b15ab85a1d520b8a874bd9b276df3e9b0dd6d1245d7889324a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0542e86deb92f0b08d7aff942850294276b17250 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ce537bd240c680231c9fa47b3ea9f81f05a3a3099de7307f0e996b05fdccfa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8867bae8e2518d07a737b8ff2dfc42989ad1c42c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6173c282b934ad2fc94b67e2b3711a236ad2a79bf332027d430995445a8c5eba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f42f340ca5ae8079649ad95df95eb3c9b58852f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d486fa704a69f5ed98076306971381d83ab81ac7d86f595e67c50c9bf589fae1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3b6fee70b8803af4d3ab2629960aa80310704d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b433dd65ef431c1593f0e563768db54138ce6b10cc6634f3f3a4ac78145bb930 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63bbe023e3a56b95b804b59bee645c477296cf67 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa8fdac3b3a9feaf63af4839b9e19ebfe823a1f707849866bc241808184f93d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..000dc9c74ca654ed5f01b86e9fface417c15190f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79af8a142421a4f105cd8ae283acbef33032ae064d06333dcad3a8f452ea85f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dd42c375b335be594c68ff4e763f1dd0c6ba732 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1a434742169cab032b3a01f1aa8b3e2c1125a303529a359d9a636a40b78183 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8a763b6aaddde413be3a0a0901e2524253a021 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ef9abb17765251459dae825b000f375d8aecc027622996a6943131badf1967 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2a3651ecebe1d2e3b5241c5b8f3be62a72b906 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcc1a8e259e433feb3064d7e7ca15ce7be343829bfef73044906395dd55a200 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad59d95126a367fd8d99faf779b3cd3a57b02f07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c633a4b0f945a76248a5a407e96a150a437ceeba1ca009159c77813e69dd9e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..798e447ca81240a7ebbf23b9938bd6c839cdff98 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce5df8ac09513346ced9d304bcf522384c59f7c4c0cbb3054edb8f0d902e731 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04cf732ce6d86054b4c82ccb0f685f3ea79b19d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7d696e1f8269a32cc8c08193e4042361ec966c8f946107a179502dc2a6d170 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f7792a76df2cc61cb1e7f28e4401f57a5a92ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb36b17b15484bcf2d6d3e1726dd0308d75d7f4eac2e5abe10f68725c7619e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf2ae06a2402aabd3b83944bfb4fb1b1b654d152 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed3c3114ca151e2a798c8e8131bb47e033846f455d717b03cef8607dd2a3232 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b2586549f5c6230a1a6f060d1e8ca340c1a6b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9d6a57379d438c73d03c8c0d841e5c06843cd389ecfa09cb501af0291751ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ef6e0ab96a92873e5a3597923a17a9ca3b0edf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794bd89f21166e9961f0314400b1bbf13604d8291d0940078bac9514ff8479c8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d818657137f3ada7789c0c37fb829e1e684e02e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f20658ce3a1de1e41f872dee986f4663b58dd710c319a99b472f632653aa0e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc1b5cb5e3055e3ad29f5df3b77b2e6a3a8a834 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4e09476f2a8d3bf04a573e8ab8fea9ff6f4383606ec5da728f4fd141713b97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a62854e77967783c0e928e931f6e846c645fd24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3d89845955889c6299b7bd5200711d04f97aa33172bfd3cb8d21a79fdbfca9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3359840735e54705716c89042b01d76c6a158b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782696687ca8ffb10e613e7da1b5175133bd4753c309d8c6e8d057eaa9d4a65d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a786a60ad586d521f8c69db7907f96c9e9701697 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02265723d2b02b71d8e52e3a6f03ff9d67fa6a448037ae3067c18f33a9cacdc5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b391d7c28b966355f396f4d73e15f189fa9035a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb451e3c5291da7ff286b5b5d761e89d89180f6e03a1cdf1b6ddfa551be85d8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f51717130f7732da0e36328455c276d6b1e9853 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2f1d9a01efd8ade88c4ec3e664344f8c3a38cb73ae282f7a8cfdd1c5937e15 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55530afc6182ae536cf998a636d1e86743cb369 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4f17189b9ee7a85f951802ace99de2d2866b051473a7cd3ca7c9112e49b521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb776d469e612f04c19edb1afee886118138c5c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d041fbeabd8bbf66aabeeeb5ef9720e9b32552cc52a20277287ff2da7ddcf8e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07bcc87936238a9aa235604b6d21d7bf5de720bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc3f9872c233f1ae2738d402b7b5a5bc2cfad5c4759a090bcbf569616cc4cab6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd7230fbd02d45b206b9137e8d3c2242b78aadbd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5be8c8b8601a904a2eb4c3596dac42cbfb84393c7819d592a0da653a14dcc2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca45c3aede6c753c89b303483d8c1612733a38b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f727243e62190c5f12f66003bfed58d76c66d813538c8142d0d135ae2bdb8cc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42b8bc1c622e19a9971238b42a86c96faa3c8648 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af50b678512917b45d4676d8ae9899957093cf636083bf03a2e840eebb65327 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7753195ba86fdab986dc07c4e8d3c31b43089bbd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7355bc5aff6a0a1ac1a4599a7b542aed05c11ab51c5e5017f6948f74bab81abc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..535fc5af18677ecb177cb4d1575d549785aadfe5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43f8ccf1eaf97d733bf9e4904ae90de575e9b67512e963f93b386019288d96d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eccb4ae340854523bd4e37a308143d6c2565c075 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff393a61f1850dcc18ad365770fcfd0643c1659a453d555057e2fd948900599 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa7fd917bb2243e589452e30690aeeb04eadeaa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2051dec177e8d65c1b2b44138d0316b7c7d14926b6cb36983aee91abb68340bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2063dfc6ccec6e63e137f0fd984ca5af9479fba0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72caede3df97e395c9a5309155ce97e2c5fc4fa1238e4f1c879be249b2b677df +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..240be56de3114a079a4fbd744e055fc4bd78209d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4940d975ea532179825f518e547afef4b6e55d56448e5eb075da069a050adb3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2224714ebc6673191b6ac7a94f7d5219c020d267 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23986e74ebc4b01450150cef42a4ec2b89a515e5adbf7ec4c341f31000ed8b09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b1a9ce6b87751fd489a30865f1bea893d302cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8605d2a626c4820cfa9cb9349e6f8158d33a4a47170035a25f370d0577067ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07aef01578883c9bfa2abd87e2ea609f28144b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ce498b71da0947f0e654f7028f7b5008942f965cd131236d84579bbda1439d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9a9a282041eff4bc67a27dad7e772319529283e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5295198d3ba171074584dd98ad36c01b5a94bda4acd3e06aeb259d45c9269c29 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..649c1a6dea326bf1f2f3d21330287a0d04384fea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37b336c6bf1cee504edf06c139f75847b3114ad324d9fddf5e812e0055f7921 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..890351c38b0c95b4d146be042821cb8c3f82726b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02851c6b79242c6589c5566b4fe41b6360f36eb7ab9a7a26eb51ffc345b02141 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97491943ab560aa4b3cbadefeab3d35ea243fe3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1a67151db411f9cb6798839d006195dea9801806861f2cc54103f34f88589f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32f3e3bc1d71bef1e81f9aa0794ecc9fd403c777 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157974dcf89c22db9ab585ca075483829500033f2e1ec68167ee93b874a6a85c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b74c7b306ca996a201937bab6d9e1679b03dc6c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5549bcd754d10a7aeeda2e3b52af7407feabaefe9130aeb3265ac6472ed119d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a863346039c8c4447069b004a0dfdf438c34ca19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc7eb8457d05412734714540d92b163a324518b5e6199e5186676a66ac066fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb3e706ee18a60cddb6baae182ee6defabd4ad1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a42aa206a812a84b2ebdf52434480e25d28538b88b47c23b42a99bfbe5868a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b5945d84475904998dbd195da80170e36089d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396cedafc6aef6c4d09185166701cb875eea91ca954322cd9bace9bc3683d7b3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee64ef4fe96ac95b2dab5b577bf52e9daaa96be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e145614994de6973a10ddc8b2704e72405c9fc7015630c70e5afe41606bd0353 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1705b4b1fb91fe15a82c39ea6e777564b38da072 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cba028170cf15b740a65b2782c2bc93ce911f2cd02e0bf8758105a2dd9b9390 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..918814369e20d549c1176fd968e6d305ad59eadc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c4ccae87d3ccd291d042e3c3a400ceaad4d0e80d7fb737ad8b43c345fc7164 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7893a1ef2bdefe4db47e2e45f6119e1ec2577c86 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2dfd7da7df38c6d203bb5a2030fc452f57fa1e8547845231f3f7b6548bd0b98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..534794fcc0b6a440a29caf9c5b8693a3e4c3dad4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4405ce0cadda84dc8dc88a605da65f058ca70871ef2c299fec9657a9a3adbbf7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0715a55a380db9af7934f6c57ab9d0ec739f6e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c52dae4eb007b472baf9711bc4f6e7ef9786f2b98d5b0c9a67c5f7a3dacfebf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df31d48ccb3936f828d82e5d07b363446e80961f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb255ec4f09946e7e25294919da4e57299041831f1984d9136d4b51c6641bab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21c76de2b9f68f9912514b08b5400b427952321d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3551d7499de891e434a6fd2c329d6827c52393bc4154bf3313e7591d865b62ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4231d1a07008b818579ac070ed402289514cb56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05997c07bc7db977dcb1d13035b90b191a0daba4d7b25ed1408674e1296da924 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62055d2f82dae78adbff531fa919c0a461be276d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00389036081ab52cfda2958cec9c3b18cabfce7a31ae8fc11fe5c6117a83a212 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b2f74afb6e5d97e5ece6683ebfb95d389dfe1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7346f6571508937cbf3e0628cddc80adaad23881b0624464e1f3682bc8f197 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..779c4f5bf6d36d64f47f13efb6b7b1da1d7e169f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bad9ad3bf3c065332b60e54caa1ed4d20ee37bce3a213c8e9dc646ecd0dd11 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71297f3207256ad7bff29397e4c6bad0dff61a9a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a9525b5fc29f58dca27d2e7ea4dbb180c67336bf1f68910a55a04277b1e8521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45cc50baad52ffcccf792181312bf80c42e2e62f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc531fd32e9b5d12594c53d98c862703da6361e756dadb57874e939687cf9f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e511236b757b77765f8830317ac7ccd9f48f503 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc2cd22fdce57ec8279ed3658e4466cf023749c6caecb81e03a74ad274db1542 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94500487be94d4c7ad3caaaad02d975dc8d6f29a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70ea13b2bfb03e285906a53c3c5c30c752a80faefb18fa97bfd4aade77ea5f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..152899143db0bf9f3c3542fc2dd901367d46560c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad9ceb84059cc0a78b5d96951bdeed1cd49093ffaabc1d3102c1c96400794584 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..054a7420ea8dbb1bee768f87b42e0fadb7195d5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18baad3d3b56d7c9199f6098bacffd368c9e417801907072897dd3785d17bc9a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..979a3a7996526e1dc5d050992ac8c9699a7204b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:683080e1178012dbeb4d95bfa4e06ab441c4812fe8a7129052ba28e61ae007b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bd0245ebc982390a64a21862c932cb84ca2dd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62796fed2b111634ca7525bfcc0dc8de19ff5625f0e2f20fcc02759c1d4a3156 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..253187d1f8a919866fa716ad3cdc8ef4833a96ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd2d2822b1202e26a540ebd6804b363a398b206733f545b0f15db4cccf8101d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d762da66b6759b7530d7c2cddff5ca571bf0a65d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99e8be8dfe7638f1d4781b1e45340c469fd7d8d8843b9788fe9ce937e461059 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..464a2eea5d206d2a660353bab6ef5edf282c44c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f864ed2c59076a15a8fb0b88fa75463ff04429d07d6c551161ee38893d4904f8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62338a0a339be663f6e01c59d8cee118882bf182 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3248f2c3121ed90669daa7a28b0c7e6386e4bd70896320095a2c0b39f022567b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40af74a3547447140c18ba8f6f5884a01d09510d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4f3d903695e943b83a9745e6bf163373e59568cb5c561d286b6d8e2b5a230b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b90116cf3a19168e8d75c4a5da4ec9a18d35e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb1678941aa3f074733591d71f3a2276b5df054749e871999047b2c2810f079 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d70c8ffe89af88e9acd69404373e19fdca1456 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a701cc6e49c3cbf93b4c6838a5fb116416ed0e47663f9a707928dfdd8fb14e84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1948e21f4609cef625d171b0318ab8b80eb97b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd82499ee9e40f2ac5f9adfe2d3d82e733175c2f1ed33c982d0f4e10a1b69fc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c9c5ae4e26764e68d816f4b3f46fa435ac9ddf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c880429b229ceca69e9ec28f0aae7c6341e172aebade7a1e0a4b55830f6e28 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39cae0c2f0cb4b2b2e4c83d1737e3ea5ce0cacc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8643e3f77899cf4826e18945c4408f82721df205956ad567e1e3481dfea644 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62df0634edc8bd3f773d076413e66526efe4319e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8e8cbf4d2ace8091af8c94c00d495856ca3daae2883535ab6233f37087f2c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15fbbd9c74d81fea455d7982e1f41babe5f2f75 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809202580fcbc6ace51805550f588fdc83c4d3a422b2acfc1ac7be709e91a742 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bb35a00fc2ce179ae79db2031e55f0bf095a4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46ff353221670f5b6c823890d136dd3b162a9c0fb10f52a372c7371b1864243 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0734f17a8e3f31a38fc923514776367d77d04c82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1312d9ff33f4d4ea7fc849fc9f4eee00a5845d9d108e3a5caea2bbe7e9ce393 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f3fc9a1faaf8e90cc3ee9ff32418b04fcad35a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4c334c58ca5a280219d0561e0f60ba5d6785c7573d4a1eb7b59eeb58a1b70f3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cff65725f51490173a75f554e8cd90435a62ef4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98732f65a7f177db8071aa5d3e1584668ff9d9773c454e66155725f1d1425ed +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e6dfcefa4eda923a82c61d7642e7134a6e14c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e8658cfdcf6552e826584b1256a16827ac0df628ac946ac40b67fdc99a6f5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e05d2affd0233cd3417ffe27fc5e29e415e82c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63261960d8c7393c36bbde1f55decdd93f8238c792fc83b188dd8466245a73da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c1a9ecb14ea4c60681cb48795239cacfc55c2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a612f88bd59bf6e24d180d7e479bed268ded0900278be9c80c67b01f106e23e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0fb60fe75fc7ff824b4748d3de2a442a792f00 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0891181ff3c622671ab3638a0581aef3f22477201444b7a1a3ccff4911d48406 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e7e2588be6257224f953dbbb692529671c20f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4301ffbea4a24eca5676453e6cc60a77ddc800585c5c17f6ebcc32ca927f6391 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b02a34c85f2a1424460e987ab012b305d1fd4474 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e2e7d612d9a0e308e5bf1dad558b0a0840d2f0ce515abfc79db1d7463f041e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb5d54d721fac391c63abb3e7787562f0f2f2b83 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c767652213533f524af5302159b64c296e1882745ad68d4576ea1bdeeb44c9c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6945bbe81a696c65242c610b45ede80dde9b9be1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536eebeedccbfa032c2f3bab8bce41aeb1ea28020fa5e014ee122a3784bc64b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b4765aca757217ff3dc2838fe6dd3605803cfae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b82e7f7e8f501fda4f44dca452ba8d085fa9d001023ee93584426eda4335de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e2cf37f6c5d4e73e18db6fe634365525307f5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ff35b4648d7842b14e086845edd0ecc75be2a9da5972f5ed4eeaa761c0e0d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca1669a95f13a4765e4c08eb961e8b64d048fa0f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0a5e4a25edbf1a6eb790c463cdf1b2e684524d3f6df16f0c7f6b8f85f49aae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f87baebcde22cd22cfa39f95b4d353cd87b621 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc140edab6e3e5775dc0e6af4980ffb9ef08fe4d943230fed050c379246a917 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d430f16e3e1c6e07e9d5e0fa56c5b729391741d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159cb31dd752263d26deed4c4378d4e9678c515eb0e43a11bfe05587053b9070 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec3e3031f30488f4ebfc0991901a2fe0b24b8c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3a508c46e1dbdae75f7c3872e95f9019dfb912862ccd64d645459163b7aaa6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c774744601f646b46f76c4f7f6762bfba421d068 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da795fb323bbd4d4ac75f771c0bc6611a7df9747c8e29a5de5d799b2d6e595ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07e5bdf9a7fabd2b5621fa69ef8fec58333904f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb5433404f8bc4115a9dac7539fe879c917013f18faf18e292a2b121fdeab2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d26c174050d23a0ffcf1a846052ef6ca6b2d82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073fe9a0bf2c1d3ac2d940641d85c706bfd805ab76c512454b4f37975b717934 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b279067f912a8a8280b29385935968cf9559bd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07171154acaad7a3f48b846631df52905f4d612a013c1bba198ca7f6f2458ddb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d323c826ec02aef2ba7f99283fc45512a66ac7d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba0c40c9c939a66d33d0f1de3e12b8e97611a63ecbedb52436e1be55beb90d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d52c4276e031c917ace917916e936fd5605168b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53b4e1d88ef03b0ae08ba08c0aed4679633d18ddb15be1e419770226f261b3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0409b546fc98f8aeed1994ad689ae107117e9cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91433eb8fdea730ef93222b1c58a31134a217784a74655b9c62acdc55f94c43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..367afa45c9393ec490fbf5c5a988b804a4096cfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f98953a18b54712ba1572bc297a783a37426d498d29c731c54be1abcb776831 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d687887ffb74058ad4b6fb8e94957bd61e0b499 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2621159849d974cdc0b2ae0a1a1f587cd8693d479525a2f93ccf3fd51d59094 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19f609e28c9e61d16815b36e5dacd25b8c79bbd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda77291544e9fc6c374694bbb522ed0956d521d2c3695feac06f1124ca92b97 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf35a1bc6f814f635f0178d72741e2f4e961e46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea0e894883305be00a32a7b74d61cf605cc5ca0619201b123887503dbfc6794 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4019feb251b85caacdb553dfaebb2ac48aa385ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53b7063ef56c07915520e9158c93e68e0e42c10a419dd26860ab65f44d6ca3e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b809f40f6f1ebf1a3ab922167bbd8b1040fd3bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1228f1db9eaebd6c7cbc2d2256e213c5550ec6eddbcf1d7a726ba6f4bdb7ccda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34629cb2f4ce4737193ae1309e7438b3d25155dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf8986c7d3ffc924c4c50937ef98102d5dd69852d7bfa2e6ce17f2b5881ae6bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f647c5018f49cc30b1840c5260d9deb0fb8d5240 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16e808e84eb97c3b93175e126b99ec0e326f422d298864eac65e43e6e8ca697 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b560f1190231a9ff86b7cb7346c1e3fb746d1d42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646b3d826f42a5be7ef68806691187dd97ffe94f9288665f845da4c278a2ba04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1687e8168e18332dd9d326537d72d432b2ff502b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c280fec818d6b8be88adaf54299ff8c55ddbb49f5db7809af573cc5f8e6cb4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..089ef4b89edd2cd4e11cbb1a4608681572c8c5e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973cda3948ac2bd2e38e780409ee0fba6ef1db23834493ad4af1a8907ec72065 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..313ddc599279b7bd3ec4c31bca339f344a612a10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96cc4d1cfe5630c9dc3420d5abe2f17dc6f5a56142a358fb1f19c26f2591d650 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccce2eabf4ffdd7b4846204b7a6416342852bac7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5bfffdb7262ebf7a2c619dfb2f00009b786fadb61abb5f5440baf0c2231902 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad37d2cedb448c5b12925e080ace89716b9b762 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c659dda61cffb0859451e59ddfdc36d6e935a052749b87ddc746e54e3f6193 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50db053feb7d4a70831f1a453053ae574d04c55a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a85b3738e562a03fb4a98fc331d221facbd790ebd2555169e82174f7c80be3f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc112608cd3bd8b0c21fdc69a09efeac8f5d1bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbdbe59a34a969705aa31704f96d69fe587d65779a179cf50adb2251331c4a8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a63b7f5acc8d894680dfa9e51be806cf02136d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7b48fdd5dd41a6d0b0ecaf88bf027dbd94d67ae924574ade51e56c3e031738 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b5fc83023d5e22f9b3dfe8d4a92c7bafcc7d74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699efa472cba94d159458c998fb8fe50917735b8835b217e76ea200a1712305d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0bd75a96f201ed832ad6b0a16226a8e40d7fe84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f5f74932ef2e4cda364b43c2dc18cf0020f4c86f8a80dfd08b93981d8dfabc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40a60d2cd001065915285c0ef1022df1944531c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b158dc98c872e61d31df368aea17f4b193de8363a57aa4a52f8882af1def388 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb06c02b24062444f3007f118d08cecef099439f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24f31e5ca21a53dd028c2073e897ba0050fe427b70471b6581cee590210ff62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cc771c3147d07bd36f88dd3507529a1eab8c85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20884e374bd0d8f3f193d5ab648603e39fed7a8639cae8339592a6e79968e40 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1de226e2b28d6b62068b0e7a081db39e2bd8db7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba2dddf3813d074d6ea743b501068633fceedad273da55f7d274bcaa7a13d52 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50cf27ce741e96a1857404bae2e30364b8bda089 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ec7da2ac971a872e4c25c52d137d48ce97ee94bf81468024a6fa877ddafba6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf0d8513c8588b6da9fdb3be6745453c023f5fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feb6b5abfcd96121df0e9d30b6cc5651938480d8053b2c0943a12785f3ef968b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7ebdf8e39362532921c37e11e105e7cfc31a29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376b4c398ea0093beacb5e858e00639936a26f1153326b1d07e38922c8b17fc2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6bfa835e8b17f34deea71b75fb93d0968e310ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc5852c21f3e3b6fb0f5558d93667a1e0f4f5702e07a71c00ce6c78fdb8ff5a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a947ae93ca374be6aa887c7528f5a8518f70faf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929fe57d0522e6bd94ab931342f82c7e76debf5f256e96fb116fe4c6ad9cd8a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6984b45f1669795bc65fbc38d736211361b938a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4846b8b51ab2017ef54b374e8c8cee3a4f28da7de610538ab418a17c9d72b563 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a15231dd44e023881d56e048626d6c88ade47d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56002cdab9253ae4cb8ed68b4ba9f4eb91430074dc704bdfa7c29ff18af7737c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..047a541ee9e85c3d74ffcbfa68eabca3f1d3d7ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5491ca8520b53093da72d1d8e5757a2509399562b6fa55a1400a747b31f65a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da925626793fc8f17c3145a75bd646e425aecdab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5cf6ab1a32a5dca9ff1e38ce1643cece787c3fe45bbcbf25e4695f7e18a4af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bd729efd27f3c0f3e994ae4819ffb1330c9a23f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52769409557bb867027ff0ab2fc85af6bea38e8a0c11cf35dd714e38a1639ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c48067ead5b799b45f80951fb04665b829d657f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa280ad219df5919620c15f282785b5ff94f0db0e7313619720ecec6db84cb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6444f4ef07d23cf53608caeebe452e703df02ac8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a8a3b46eaef54db8d3a4311f2e2461657aa561d706cf7d3d42c6bce246b873 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5046484bceac5c68d4b7264569fb3179391793d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1846641518d52fe5900404eff081e8443c4e191507c2948f2070d71f8bdbcb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b3e51983fa2d291211c60df1a6642171333761 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3337230478203b80c9eef27a426cc209dc17335f4620e7b7910daa874c57b074 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c355d7b598a6bcf99007d6ac18b8f05c021bfcc8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d42ab628a6b6b2936164008b760c162f586313140d62496ef41e380b9f349d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bfc86b1b20f751312d9e920a32388eef6986d21 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586b57f2b64463d3f6567c41be028d68d23b66cfe2189ffc071f29f6557c21cf +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e06121345c6a8d47ac2a7e502c5a13691d1bdf7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d66fb6f3e18ca8dba24277e9ca971af0b9d6a89ff77826fd51e2769e156063 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..871574da98dfd210764033f849b625552eb317f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6aebc1003b36f7a94ea2c2c7c04b26fb914858d3e05208061fe397c2501b922 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51319769dc7cfb52ea71d8f1b6005991156b495 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36806091dd2592df22e38fb8917b9bd7484fb6dafeda6b3b82f4722d0fee6c54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9620ccd99997ae79b28775cc5f34488a918eaa08 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4280752e72b5e92368dcf1c8c18ea271c69a72ddf8700dd65b290ec402cbc5b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55716f8ec4c637b2bbdfc5c94fcf96ab7d5c85ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122c074c41208d2d07372819a9b8261f34d854a8f394ded2fce146014e7ed862 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e2357b43d62c4d1a1635e3697e4e667b1ee07c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4a39013550c3dd6a3d7dac7d9aa09793cdb5fdfd76c20e055cd83dd4b3649e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69fc4a4675f589bf7387b8c86cfd670970b62e8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560f45b3ee455de91a45aeca5e4a0e25fee03b62ce4d6596846c61c5e5307dab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55bc4b3ae73358756d232a8730a780e037408cf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a19b5cc95e32484887251116106bef1b5cecc1620af1b6c18ea879ea716d7e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e16738c37970d869ce55a8a7afa5462a7c7951f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646e00c213b113afcaba80795d57c36969cd485e15d35e551a5eae04866fca3d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2845360107ff26654ffb029b106eaac550c2d626 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_5/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477dbb2c9c67a2f5370dc40bec288a6a7d2d5f8acd2c76c80f0222cca11015b4 +size 11395