diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f208135249737db5da606170a20783b4cda4235 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:645047f57abac43d8d993e1e1a2df86ba20a4a220024a11be907b15cd670b7ab +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a00cf2a60a2b31ab5872f451127527814e14218 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400e131d474439206381972812b72675da9bba3d960a979ccc7666baa56ee485 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2cf8f430e396c6ea431ad03b92383963a87112 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ab43114e14a515ec8b39cf3d34a3895439345b5ec79ba001d8e5d998934630d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fe0ba1ccc9e955bb43611fd9f449c1cf3c63b46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab456d5bc6581e818bc7fb09825f70a4f334c3f299da1554d0bc312757294f2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..436458743337707f2b380d4b17ce2cdaf2a00f46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3adbc8c06b26c53c83d6b74eeb07f89919a253a937c1b8615c674a4323363c3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7584d9921a2ad00d2b77746cb91f0dbbf94f2434 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c3a59469eeb3b84ba20fd2e28792f69b07f4aa8bcfc38c50701071c6bbc083 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a9492586b67f14161f6b7ac42ca252538cd085c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecb4bcbad586be843a596caf1d2784caf0e85e9aeccedc6c707224bb8fe8574 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e7d8247a135c64ed6429a350a784db7f1e8ed9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a79d8be40d25258ce59d2e798163b74cca2de3d15f4f96d0e4a28170ecdffe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e662eb914f27a19596e40b53e73e12bd70ec769 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7bf9fe78267a2f8f9cee478b398d8b110c33c1ac7c87640b3c6c76ab1508950 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a5d63e02216e5f4eb8c0f3e96884f84b1bd14cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d649e0a85ec9227bfce8e07196794fa618c54c4cdc8fa56b70d247ddfa344f4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d557ec43b6cc22246ac786113708b8fb60505445 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7762fc81aa5f7b2ca0acbdae55b4dd562d9c6517a374d1d8c3005b3e026f8341 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6607456a42e14f86510dda4e2929773756e027aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6fd39bb09c0dec82505d75eebf6f6e38cbff2c745c4355c042c0466d738c31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb926b851ec3795dc65adfd133259ea6c22437b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a26c5c646d2e66c363193b1be80c98935a3ccf276cf787bb47924aad571f03a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7c36354cf9b9c84d09c2f19f5fa6417ed60bdf8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527fcb4f38487e9d18849b03ef36721bfa36a317186a3ee58993a7f11d040e4c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6290def28f8bc7ae4b9dba5be67842a9700e7080 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897d1082a8695bfad407478c5858bb5b1f91de5d048d28ae04926e3cd0f0c992 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6db4eafbe0c224955f46346ea816180e633c317 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd8992c962d618cec301eb2820035f4228cb17008ef5ccafaf6ac3130d25d4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a103d69972785a0a4f3455f7c7b7d8ac038263f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b01c8f9a379878f44889d4b9e981149e2e4450904e0c45ce52199eaa73b296 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb5a88a960b41bb430c0a7661c4cb78b1fa9327e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b58f8d4edcc96de6055cff64cf48739ab2fd787da0270fe3b67a0629be5924 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..865218b8bae38656cc45222fb147e4f32ba2b963 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c341e65440d50c70219e03c365612aeb2cd07850bb070ab94722af8156100f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a2cecc2a9b2f9f9ec5c7603e7012629c5f99f00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a38078d517bd7fdbab4070582531004e62feba2573c6fc16d8bd4d11301bf34d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3313407e322edca0c67a126f49dac793529f0669 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087e876d52012a40d35bcb3b61d8f0d9279ef2f39d14dac88103445dffa7e4c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cfcde50368941e846867f1a0c04fc8025dc6fda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f501063bcb37d2dd5826e71a3ea4c794137777eda2adb76a916244a43b1a0ce4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a4a84ae3e43df15d120786cb54937c59c8ac9fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba26a1c0b8ad8a02cd42db09445743a1954baccf61d691b5291c90de50a787f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15cef6d798ce17425265688ee9c68db4a166b6aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42fe49e81419131f9c724f9bf23a63319503db742d7276a2cf1737b19fffba6c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6272d1ed1b8eb571717244df606ce8d6b3e9d181 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a0236f9aae8f39e62e66c9c8eecc923fb3dfa1edb2d228ce56436c3b3f4a0b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d5fb3d084d37f2be1ab34169cb66ddbf974f92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d23a5f7493ae8bb670042c7106ebf316d1e6cca8cbfd5df1091a09fad67153 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a7e8aaffec2d4fc11ca1532f85330821378330a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d206385b4389ecff16e0d16fd5e8ef6b26a587ab93b7030c8158e22c737696 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1149dec0421a068d2530ba718b85db7917be9f9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f7d695158d2843305cd4c7ec645069569036291bee0109bba4e9b27ad06215 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0978b86610c1a38adefeef9f44af59a15a575f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea78eaae5a87360f8309828f37fdce9e7c86bef69b8e722780179043340b168 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c133464d61f1a653edfa08234f2525718d8091 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9adf110f25eed3b8875d127fc26cef758658fedb5d82262fff034c738cfd3cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f243694798a3f5e513eef493806ca70ba156e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87cd3f0492b14dce98c45c2f5a0709f388420d86bf4c4bbae538047cc7a9d1ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d531fde0c6ffc365fa60b60694574ef2ad21bdd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cc3c6f821158b00c733edda0569b777517eba8120eabf31eaf892f8a15fabb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22db1fe61c36292986c3d33ccfde620f5d392663 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eba1b1d058ea2ee20db4d4236af5f722731159ce6f5acbb0704d28a107f314f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48637f888dbe93a2a9cf5c120039c9af85a06ae7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c80f083d2c93cabaf2dbb24cfca36cf35f90bede70ac9a2a539d591476680ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79f90621a462fc50f7bd21e9d646b8f931b90fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f30ac48e80bcafd3cbfb720200fc8fcfa9f896a56b879bf995673b077005758e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2ad741fc023f28994f16f88f5b9c492a8dcd07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b49f1888f769e76a819b1b3479a5d6c4c14b851d81853ac205a6651c156d61e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f410e31728df473a923a8541d1c75f4b25f4418 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccdd724a1113abc65ccad67c8826b5dbcac6f8024918bd52c2d1b96ddedd6c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c38f6d7977f62fa53081901506be3c54e20cddef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1369dbc0f6253539ca9fa8c5ccbd466d9d0e846b94846e20cfd2db9495d314a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d80af5510dd879eee2d005d4c3734b1c5c680b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a5a47133c2ecd030f5f437a5fec88f517396ee53c5a36e0bf8c501e60304fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d17a90bd03214092ff4c6628ed76758fbf8e3bec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95781d585a8fb2150414fe6507b98348a490b142d362a4f6f0ff347087c39d9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ecc50b6c1859f126b3bcd679d87a684a77f348 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb04daa838b47a374828c4afd6aa6fa301a5864e1cbbc39cce81e70402d4fd9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30346385aa844094be65a4c148451e22c71d8baa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ee582c7d0fe678dbb25502c2d49ab45eccc200998044151f684fdd8ec9a7c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8fc838874298fc87c12219dd79f6c55e185af4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09db76002b66968a57d560d5ce83999f365da7fd115262febc198cb00472d0b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..489eb1edbd6382f25ed7a0c34b94884f7b564cf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ce0b586f894898fbb6bbfe45fe92b62edad52c79f0b3db051970dc7fc21f53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c2a1e9eaacc8059b497959ab71ffb3202795cbb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e0982bc6bf953e11bce306aa9eb2b086ef21341f3a825ce57db834da2e36dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f46679838ae0ec1f6751d401517fffaae6953aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0953e6b6b018c12371b2937ada65be6e164711b7de3b1cfed39a286dea177e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7e347c0ae7a0339386edb2d2658920deb4eb0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d237fab021c525ec1a9e4c323fd767bb2b7fe225932229e99b2122ebeb1ed9c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a698f00dd210ae6a743ef2734549460cd2fb42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2cf58f280fd132885badadaf6ce8e55a4e47d422b7d8d43b20c2a3e56b59ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf7bc9c21b51647a7cab234ac73ccc634b13e22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9f3dcc000922290675d23e7354c1066dd9d34842e445e929a15fd6cf911a1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da205d695f78fe839174a51c3ad3147ca0196c53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7e839d2fbb34c0fcda1e90a513b05e7e62d2f785d179ed6717af96d99334f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44739502dac8900bc26354d97e87f625ba297235 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddf38bc05529905d26ff5ac54d29338bb5d1208f3ac87fac3f0b609d7e6c0f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefeb40fda5648be1005d52ab19cb691bcdb5833 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b3f138a04e082ee647e88c80a0cff2081efc4c758b80b2e8d0a3ead235c080 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02322b14a27b23eb1fe3705aad548e00363b91b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5250faf864866af8ca828a8426f5aa10e1ad4d9d8f1af95748b3b51509e788 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31bbf92e5e63e0d1418fc5b7dd1b90d734740baf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cae801c161bc841e61a44a6e026a7e40dd9264e547250f5f6aa451e0cb95ce6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1686d99be9d9df6f94e38f919838ebf315539713 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3888d0432044ba45b959b23b50dd7f21bc80333ede8b99351d5da0b62ad1ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d7e20b42ec07725cf8d44ba76c84066e48fc28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0086a7b5428e807ad42e7bb42d456ac8e3a66a123aecd72e7c165c971dfe06e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd1871b07f65037b00b2d42b233a9628274291f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ff83573569bc941774c74a962801ee772dcf3095ddbcadf4e5c587442653e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18cd9718cc3f20e9db18f95748858ebc756897eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888654adf6322d2b25e4f0a4d2a70d81691099c6741516414535284ab5a27176 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e66f2aaf0ceed8dd0ea9fb5059f20390c9737c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b53630931d1d929a3c58e9fbcd8608daa613c95140b55263e0d2dd7db37281 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..233bb2f67be047383e75dc6891e7d26c7e5f161b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937dad6f18a0df353c906578b720c2f1575b0fdd51b9d1294bebc9e3887b5e56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eee4bbe7c4a9f20cddeb2b9199b8ebbf3aa31c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f08d9bb09fb9025c30a24202feec1eb46210bdbeb28dba78bb1bd9c22340ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd88c498b07d1b97f8454720aa87f7292c1ffa73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e326c281370fd48dcf40c5ebc61f5adea75eeb4703e98aa207bda2584bf8aee6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81e5dfabfc9bd00a74f5cc0e7abb87a6868c96b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a38d31db8b9b529c10282ca53512a6cf0c7023e86a283073859015908a4af3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fceef06d7e244ff04fe42f4654688e7d33da957 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d155c186337b54217d49897a7da9d989d63e727cd60de4056d6524089ea3e7ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a4d92933100f351651e169942d0fed8e1c0451 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d743e2e6610a3466ace08a68390ca6a3367bf595ef74d3ad03d9968dc0e9d46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e198043a51d8928dfea42f8214dc1b8e7a024681 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52edd7e950711cd3075f6315df586a3c29593e75497961a1d04256092b4ba2ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86cbf9903ef7e61d5d1e6b0da068527b01d43e52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ea328412118fcab570cbf8bf03473647c3b770fa8322d9c95ae84749cbd76c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7550bd30982b6dc9aa8e60144e0a2b174cd73c2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a03477b66ecb4d0a91f5065d0a3ce2c090a8b714995410f134da1b95dd4ed03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ee7153c6c996af48fcc52764207213ca9cada5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a580cb24a511ef1513a0b3ce8a04791ee670c44ff368ef59c10e3ddd8ae1bc40 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8e3ce27ebfbcecf36b696b51ef15ebca7aef1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3182cd26ed2dcdfa24b37bb8519fb9ba273d5c6ded6f979d248da3bfaaddaa30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82f4feebe44e16d58e0830421d7a0bb941bed0e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d1c038efb74f98bb49d20337ef60f84cb89228b156e9bd8bd3bb3ffeb4c844 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ebd47d6178363d888b1e485f415baeb8cbad6a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eaea378658f9de7a7010ae3024f567a0bb3f597e147e270371c1a6b63eb4c23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..415f4e7aaa6e2a55132ca825fbbdebdc117d4baf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd4d29c318bdde14cac7dfb08afd7f89d3eea29defa46b99d45719dd1a92f95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02553dc1c14bea0ebe7e2264031f6b1c028d5d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775860d04488ae9c661da4cb9364945af7a3ed011f6e89cd6483a05ebadad785 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fcae6c319c1d4a9aef6d8bc009ef774e57f11c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f8cb45e4e3caab009bd0a656ff24881fe3e107b6b355338cf7dddac7495c25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00cc23d9484a1518b7104ab811eaca77d35b9d90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6865b79c817f39f3b5b911c47a6d1a9e951f814c551f5d01fd20e2c6d4d3b194 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c1e6c958740b5248ba79dbd80dabe3c4ff92a7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac0e5498a21d55787919bf234871b1efdef8524968f1a420a49e56d2091c951 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..414c452ad332783a2c87f11ee23cd1cfa1f02ba0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43148be6c65fa76822e74f4cab9285e1fa9fc29ef591cd07db0f9c0c16d6ac3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06831539bf21040e5f3e2aa644558ccfd0c01fef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ea75ec58f2648da0a1515270982f5afbca43dc6b59e1233dac10647577539c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0fab20f3a394a47c41d0a48d4aa6912432b8906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed6ac842a31bad50c7894cf8235d9aa8b8be5676dcfd71939e3163dba33d457 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed11b95572ea1f380d385e247858c5407f3e1220 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6196f47244ed78d5f56a61d4b57486df7f21ddf40eeb8af99f4242679b2ae3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc51525d15c91a2a5ddcadf1a017e5fb892e9a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f702c01625a0d876560ad9af9cb033f8cc1073622b69f013b560540b74a30b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7de17853fd473010938756536d2f8a0629aa0c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d036a6a01b19bb69fc7897e6f7c4bf65e91b55b56916f51e6d91dec873c2ed51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..314d2a7937cba58d711a6312a1f346e5dd3bb621 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e35b8dbc206f77b00085b85bbf022ec77ac10bfbad6188f8b761c5c2dcccd1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d860530299aa02266552ad9ae31442269dba4d1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd91ad0102e3995162d8844ef47dc082bb9b98ed396bfe2f8c41b8e08a7764fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f145700e954dd45cc4f11561c63a75b9689e37ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57735f6261a8b3aa2f4379691658eb58fe1c3edd4435093728908dfee21bb764 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d744745fcdadecd151177502ff1c039f58f146b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654ced76a7432bd48aaa4d6cc0e2deb9e44f6e1afc5bf572a130fd6a264adf55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f8e27c5d7a74828bd4f6b22996aff60008a4a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620d578a807c7c009078d1cfe8e0c4bf1eeab33ec9bb1b6d2c6165029a6ca07e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82af2a3967ecc1ea8856e78d566b5ace38804333 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d593f39aae3d7068bee8d388793fd8c5937d07d4ae1a36439b9d71db1f968b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e869648428f7925cf6a477182371f4fad29a9678 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c014f5a8b5bda2cfb62218ad9bd26f1f558a1bc778db0571e11f45528e767d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f72ce07613280bc1460403eb990e5175bbe4bb1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8a1c86126b25a0a7d5766a9144adb4a20c8d15d04fc208af275fc8d4bd1ead +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3017e4eac605468764fd9fbb47392b54a0a2c867 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170fe9886051a4cc3dd733ffee0d19163566e007a2c34f0d1b56e0a9ab1e0acb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07eed923ea51af7214ccb96223d3a0735e52d24e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b1855d3f0bc2f8022311432b8bd72eb41fc76679dbb8677f4c22f4aea35faa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a8ea3ff35cb8af502eb572c508ad2049b659689 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24d1d8ec92ce50806f6656fb3fa22d0cca0f5823b5f4edce10c36dffa8e0a74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..013f6aab87bf2657ea28c7138755c7f5f040fe0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38fd7a1ec4907412f212fdc240b2956839183950c28e6f939e6fc3b3bb4f87a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ea5f377d1757711ff1cb2a8f4573af48809891 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e1d54cf8debf6e59f2df62b8a0bcf5294a72d3196a8b9fa642d828f25ab5ff2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ee40150387e2b1d90e20450a3e4f342e6a0db4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fcadb82aff1ddc2cabb85d28ac133085b36888a7f7c5e224abd665d95684fdb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb80aceda2d82884d6405f02424e1937912e8fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c7ec4c4656f1e508df108f1f20673199374c6f707861fb65099491ac400245 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5f9440cd2da2a1d59b1ed5c6b4b951d9d78c2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf9694380d2dfc728af2dee8b65868fe199d79000e7c176dfae0f822caa8ef10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b2a19597ecbc8e285b25e7c07293f772378735 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a681ea964e86a01783297b0f8428ccc570c343aa6253e959925dfe637538028f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..863452d48e0cc757c2ae1627678a882146ec43d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abbc0f77ad2a805cd68a2b3e7fbc6bb9ed04e370432f440e6f0859a1b2ac406 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..193e2786b8dbed3fb5e61dbb58439ed7bb50450f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0ed755bf974b3a312fbcba25b3d22f0c5249517c6005aebc633d69882415387 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d42b3be83e818f2f46a01a10f9fac2f298610709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4c863d2b05d419ecf88bdd2086679d98c20daff3cbc90e316bc1d3db650072 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac817271303ac0bedb0805ccbb20af13f98a65f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d62f6882394282ef8315a088b355e716b99d62309739091391c821cb6df1e58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c98ac709fb36a96a21abc4e1ae745d2b8fd3cfbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd90f3d4e666fe10ee3ce87fd5181c8d390eb35c091bb274e3945e2876961e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2433d4c39a3e902fb59ab7ed42a9940781b2d813 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f121e78390e3e3aacb0b8979d65a490ae0e6ff9481bd4fe455b6f276c158a7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56dbe1557a9b035ae278d03626f6f470a630941f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80870be08979508ba63815c346c11288600a45c81b34cebd0a40e19da52ff7e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7065b997cbdda48cb1efc9c6dea34ec3ca8fa656 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38fb8def39463bb0d24225682fe9b74906853d3f4d996f359efe50e38c7df8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45438d7054695cdcb24439109a2cf12445be8a54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cae3e18d3bb271882ef85a26671eb25b5b98d9c9477a359e2505cdd66d2f29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3623d06cc2f6a4fc61b22874db83b7f679aaf71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edee8db359fc04fc6228bb77fac5d6b5cb8e9bda4b121a761ee643e0fbca94c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5774eac4b20a8c1e5c690313c1020c570d34193 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c74b582b9023c2b8acb5abd287af1a16a265edaf558e7ccddc38f9eb6404a5b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e71897a0ae5401684143816950293e568146d27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9655240db200d5f9d7d208a79b9a5e153214d314384b13de1dff49bf0eb783c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94bbdb35cc83eda732425f67e0cad546622271f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed49e92cea54238f61a4b186e95527026e14df235195b9ee3f8330a5e0a7bf64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c26079c1583c145f765e728ddb5e0ff7919294f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31aa42400282038ecfec16fa33b68b45962281f500914bf12953ecc78d6b6b7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f951d52bad92428ce01bafc8c5891e9f69b20b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73acd27af1691f8811de7207d4ddaba09f8056b3e6542761be4c25f41c3c2ae2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd962b0004056b31eb83f1814aacf3f700f4abcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b1b5795b3035ec4bacb16140c88a332d4d3f75a321be5599e548ca3b5ecdc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9666396f933d4012d72b776cc8ea58659921c050 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f47a144522ac63808e0b78831efeb33864e611de8ccd7f6b9d13d471aae9b248 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4d11a5e8020d7650ebec1c5c20f52092cb2563 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f592bb54f04c2b1bb84ebb700ae05b570e50182ac5908f935a67e7ff51859c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb5541678a58ceeef56093b72841b58d001f887 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bef14f3033bbd9c39253a5bc80b4369335701ddec529591592a5146b2c7a5f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16dc12cefe13f9343d36425571db14426199e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f18432df5ea22397a80dc5f78465a1a5f8e62a06be24bec010978bbcae1e01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b92445d17b0e0794c8ba8b066a29e51a13a3a58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd5f1ddeca1b4b7e28fb24b2c0d7f687b119635e99145c6dfd1835adbcfd02c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b860974ad862ebafa74f48026822247e88df1f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd41ff5f7a5ba0f7e4b3220acace288afdc023ad9b88bbb6289ed522292e2818 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cac1700763d2a5f63daf61f51d180b22064d9bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7820fd14e43366ec75afe1b23c1fff91059501faf788875ebed35c49471402 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8526f9a018d3f79441158271a17f98c0b3666ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80973439699866c235d1a8bd5698bde10016e04b41fbfbf100465e5938469c16 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ce52c4ff8eb2051dd1cb0481b20092a4700629 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af25311853db5c0b7ad564e2c680288d827e499fac3933f298655057740efcbd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..843f7084aba44750c9c452db7571c7786b26d062 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64475ee9007e8afe2f6a66c78514825e7055e11b0add9b9a398733ae615e2e23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1bd63af101b6e6cb66013acef1f6a35ad6c928 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486b24aaf39fa98386c48874d4825ab4ca9669449921ddfc3bcea24aee96779a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..951950c3d702698ab626c596b4c8ba7ef9deb80c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c218b3aa7e1cf50a53b5e3e05d28b28db8c10bb092ae153d7bd93b121abca42d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b624637bfb0d5a936a0b79cdd1241b233d3f3bcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f87a040004ec19b0c980862e36678e2408ce3f86d8255d92b6d21028aef3bb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dee766e22eff7dbd63aa12109515cb1e3c23313 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01058bccdf5124e1cbfc547ecb22cf7bea05edb96db902ce38ff65aae7478c2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc16a49da5a7d90e3d906e78ace37aa1bfe42113 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ae20b3233a8173220f1cc385c0a8bc28387a5895c866302409fed85c598fa3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bcdecd271682b99495dcc50677c3230eae90d8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb1b06d7db4c020f14741664db5d66f519ee8391b5b3a14d08086200ce77675 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84767310d47d1d2f04eec128868fcec4923f455 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20804415b1d25fb6e4a9ab11bc0b0aed2cf074aea1349e52511e71f98ba5d81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d64707914783d5f56927bc3c2ebb0221109aebe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4439789829fa5ec6c8ee8de00258ff83d4b793b617dd578f41717580a03ab47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a22c97a79eba548fa587cf94dc88a3026cd878 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b366ae8edd061d701a11039fb15e782f338142beb613d098b423e2b1d1b23fd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fe66688c8bdf1b4d0309727d318b5cfeb39f7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c625607f166767a49b1d517c0f23078821157c3903d5442e2f9bd515af9ef870 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7047b82203f232aa48e783047ea657be2e6432b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d3ad10a5af20183075b474e372a3fbbdb481ca951048cf9b221ff273c555cd9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef38bbabae8782f6759baa9f86b83f94be530ff0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3b7bb74c7a7d49261f549126624f24d6dd2506557100472d766d8a57107a60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da96278e50a5d73e6442af8509141091b154b08b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecccb407480b9ff1d5c148e81ce3a315d48984fbc2b86a63da78d20c5e87e697 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb11582fb8dc189a9dba4013d1462cfd183824c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2cee555371ba5a2da37dd50890bd46efa3fbdc12b8e0f764cbd5299d04fe59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08cf7835ed7b8f9c5712ebdcec827bede7c2fe33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f411a5c700f8e7869edb212bb906be9f3c4f96c5fc2f7e2b86a9480afb6281fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c0aaf7e588e277eddafd7fa421c0acb6ae6b2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5569804aa1a9bd9b53202f6b432884278861b4117679685f663adc0bf08c0aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40ab9882c95be123ee82dd684421b0242162ffaf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e516993abb4bed56d4d748000c4fea7baeb43f8a7112be200e16c2553495dfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b01dee2782d87a520ec5b51955dccbce166991f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4989f8a0d211913f22064729a7b950dcf4b82be67d360e1882f76bf2ae0326bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e555cedd83dec99d59d9626d0678a252111e904 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ecd3ac984cf1d961d4824101a842e0b8ecb17a9fc4dddf7e2cbad6e3f9e447 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34882d7b99a05c0209260ac8ba7efca1015b8f86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4797649514a4ce508af1c984e5988b8f90984f5a49da2f8f627aecd3e8aeb71 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a29ccf9f4d138f8b0fbaddedb8918689dcb7c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445e2ee1fba6fba623b0cc555c29cec0d76b405d9f00e2166565a74c1d8ea686 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..971902dccfb7731d5b9b5f3f88a6d3cd4335bd15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a460a10d41e0b6bab3548b281c715378251c594f0509731cad50ad6fea74938e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b57a237529ed5a7036845379fc21670121fac4cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556502e136db47e889fd7cb9d2fee5cf4e69456ebef94a2c57a6d312fd19da70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf8446bfe0e113e8f52750ab4aa5eefa36b17534 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59f0956fc703ac9c66aa268a7c4251a9a79308d735280302c9734526ea82c7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b4f414e80efa1dc9aefa76a37581d843b78f32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5f23546575b897d22048021313af45d2d013995b39eb180e850071a941429e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb2da3dc994d9b266c9aef6de862816c39e8df1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b0fac765f4bedd75057a916dba3e88e462ff6598f29425787351d40094c8933 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3e9709dad6349d9d9b97ad0ee7e72464669c78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f931e780902112d5f57f04e04ab1f9a00861dd7974d79d38169449c2f6d978 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4850cb67b391e4536a1a245ea9414642f6b64ad3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07d29e90684e80eed3aa14b20d856c26e1e9e65925bb1eb76bb29eb3356d919 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b095b3ad36a2a4c122b43b58896b717d585dda78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ea169721520392971b9614e3fb88d5aa7a62e6d381e1265afb96bc8a032eb3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbec1a7cb92a34547f64c907ba97fb06fd16142f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f351dad523a2987e6f98e59c46ecda7cbb65b87cff90a00e25cd1485c645a226 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b493a1569cddec3e1e8761e0cd96d35424206ad1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c217bfda44d743b70d9fbd1fe80e46959f0c7de955ea446424eb9f0e983a2d6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db29439d55b06ae28791dc6453f1c1ebe63e371c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53bd2af83692311ff199eb5d6344dc2f3bd2bd33f29ed006aa30a9f86c8e694e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fb8bef4a8d2b937b723f79f3547522d2da73dbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54705fedb2396666ac06e0026eb84336d37108d7f191c8265b404d7fc81d4226 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9649a0577d4aae8e49aefe40e9348934da37ac96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82393f877276e39830bd06cd5b34d090a650b4e6ad1d853dc557be044280171 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..398a5e5eb90dcf16713977d624225dbf5e31b611 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7356bf4cfd0a72c4e08255314ab3270d41dba086420d5638297f6ab22ab8708e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa84b82bcf13f3ef55ed841466cb03b4156d00c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f3fee5e6d3a055830c3b1b9e3478de4620a7df44d4d35fd6f5ce6f384d98fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e843c2de1279e716b535c1f021b4967aa9bcc4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb596c145021ff307f4578ffe182abcd08e3384450e5780bd88fa53a0a511b83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab6f9ac829d91bba110b5f85b6f7107c10f0af9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa832737128accf9a329835a4b3c03ebdd29f99ef53adb499324086ad2b1095b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bef47a6047f7e3d78acfd1e669dfc68904b4f1ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60aea1c3e2012c5cf527215b42104d7e64e2a827df2a491c42953a4206778a26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0de85a662efbc106c013512eb77d5fd392b76a41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7b6ee8ff58bd7b4108951a3255358b7be5f71f7b01a4b5b4ccb52094a6e12e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58802da96eb6134065f99ee9ed1484c524a7f323 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecdbcf77f73aaf8bacfcc721322160750946b927766a0e346797a874adfd4ad0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35543d96a698214b0cf27ea7d06176088bcd869 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b136fa1dad28b15c65ac67abc0d95716f037d40d3091963ca4f9aa53878fd2b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c513b381896ec976406b2c4bb64b36b85cf9c663 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba2df9c1aa987ab854bf5b8fa63f5cbf71ea642a734e397de6bd940d21d149 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42eff0a5519c0264e490b1d08db18d715501ef62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf40467255ee88bc5bfe2007bc67f30ed5e5400b354596a45b028b738acad45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a39b64d317c0504a70795345f72fd41268d9f54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff55c2c464fd79153dccb93ebc2082bee1ccca5f4a355a8a7c9a4630d6c778e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73d920593771996ee54cdcd8cef62b4da66ed7d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486da18cd4b7b87b11d5c133c3fb49fe1efc6311415698bc017bc92d27098419 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a69f28e8a49c7fc39fdb31100e70490b617e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3c7c49b107bf23c3536c68f5738103467bf41b033bf10257a884cb6594e67b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b1df5235a0b194ca63ccfe97d69baf924c56f66 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9ae45b0ccdb819210627fd697f190c6f16698479bc46554d6595ecdb03a6a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e6718e32f8805ad6ef33f9e8d5fe48e35198fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498da100beac139c1a0d72c2d98efdbee8fad7b4c50097079e05b9edc7f6c413 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..629c4da3e47335c41a1106be837154da81273969 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03925e7dc56eeacb02e8113bbb2ad8842ecd0b29fc947eba628c259bda70b00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..633577e7606aa5015edb8a06e6fdfd40ffebdda9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa7be94638565879d0e3254bfb99ce3f62b58d54596587a10cdb4bdbd6d3573 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf03bf39b853f89105dc3517679d167fa7a8280 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d5424007598d0ab88f87fe088e3dd1176edae0e30da5d19378faa60192ff0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec9e21128e6c778bf7c82ab1b4cf8517eaae9cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f96b74f151d729462b0030ea78748a8a9923322cdca9db52c2f37fed626e3f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afaa357f3b47dba6633bd7bf8848d70ee1067be8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc86dba4538765f2a95e8e767778cce99a4d89f2c5ca59d2a11f2e5ac50761be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..719f7450ef25858c102343f1ef893ceaeb38ac0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dcd6f0fde51ed5d167b300901e83d436582fd203325fbdd722abe00d96dd24b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..822ed8b7e546806b1e9d2c9201ec4ee2d513ef36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27cccd514f35121dbd6bdd3c25092def0ce7a7e6adb901f999a6b99cb55a27fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0186bade4d5d6e5f4ff5463ce71fcfefcd35a647 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598b9125440a468d04d2fb061c39b621d61dd2a1fa5c4711c7cf607fceb0cefa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b003839bd3571ba2a616cdcad0547c7fe4e25e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9da69b13f82810863b5fb4d0788827dc9211dca914bf9aa1429d4d412a9873 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2fa56b011ff907121e3a5d1d227a8395e1bae5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa43d90762b0f2d85661167d48093a62cb680f855879ed0605960c0092ffbe2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab49dd2b237dab72573a87826a5db5e0d1d00e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21eb8c82e3fb269b82f1a34fb4bcd8d72a0a104800be94c6042140d029ae9225 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90badcabfaebc7e1c9c1e4665270ea472900ce36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3acf6d0dc9babbd2f5c8232ffabeead37bc86e97d20b629386ff2698d49beb3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a3eda49c3646b4c8563fcac31969a4d9a82ff68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e731976e0424c2442a9be780ae8006410a533abc2de245f83c9be12ae0cb0cb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e650c67c4cdb983f2425aaee706e032a69550e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936f0cde789d3dfd1b5ed85e9c462327bf67cb1bc86ac8df1753899e80bd829a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64ee4a5aa2827cdced54fa10a6f7083a939d82d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd9bfe48f1706f1754c2ee9cfc80fac63ca55a916dff686c8f5239bebbc1625 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..964737233e31e68228e909663f76de069e979685 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621511f5e30e13cf1f299a621facc5efdf5b3e6626895bcd2d189d0f13e379d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c247653a15da991ce8aa7031aa21a056a83834b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5de572b4e6f630cc2e462099c91fa1f5bb6aadb8fe5d42afa88b829510464b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f15fcef031ca789a8965795e3b9b9d0d8f58b0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f68050fc0ac25089a6c23bc3b708c5c72c9a78b134cf4735d8f5a1a37e3a9ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a4d18bfc8af4eacc4face39439770b0dcff90d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08daf530430902048d7119e65b17512c509d9f08b460bf2075291bb79d4de7cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75a9b9feb0354e0fc30326798124ab513116684 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eeda58b32e31944cdefa2fa8a0bed498499ef0fe610c3dea0a0ca09824e278c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c88225e7ecc7692f5d95de791ae5695c8d15e5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04876e326f659d391ed2eb86c1e4dac81acdcb01ea6bb576ac6a59a3cef2de64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e3ae7e11fa39bcb697038d39defd2b58b0d382 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5d64b473fe27442b5a8eb3fe38bbc4e958b35c9edd80462ccc029c601b89fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21aef6057df2e8c85c3d2fb055959587ef74d310 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f0d4331d42a2ac4f9e0b5f7f1179ccda3cf378d1f064d030aafde4354b3c20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a62a42d02ea72e0651d0778ed2be821e699966c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dda48646a6ab6aabb353c2eaa893a5b4633ee02934ae23de09145cab17914d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08265217c71186e918a6d840ac51cc6fd99077b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6ed585dbd3f807957815d69d21d2c0b20059d488a65d7c35c32609a7e87b1f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fafcd49a776ff06216f58f8f44bf7b131c98795 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e592869a406b7bd066bbbe0835b7b4b0d53df2518e6741236fc6f65af4d5ec7e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..976ab488ad0e16998ed1cd5b5042009444c50da0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e041f25b31bcee81832c7dacf424a7559184912ecd2169fdc2e562404716178a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9703de19ecf05bfb1d87a27e2096f2477e10d5c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f57eb01d107ad1c41291b235ad605682e4c5bc23e527ebdf656406b8efe0bf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79eaba8f4723a80bd2027a0d2a116a1971574299 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6755e4f1ebd241a4cbf10e058addac9ea1ed7c2d6814a3a891cec43a5015f5a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45b391249cf43486d8d91906f1cd739e4087c972 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b2df7244557c726f6ed41fffd89e50439f19a04793482e20056163e4f01eb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1222ca489bcda6221d61dc13f99027734f377c93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7022f6cc9764af472ab5c32971fe9fb59e01e22046daaba6091cc00636277c12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..903bcb2823b519c1f5ed97a4f5484eafeadb41c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565cd39f53a94494df4f5d8400c316ff8c45b87087344de15f0daa3cbf20174e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..054435e2619b4023aeca016fbb9f855d48aba8fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ec39e9200d74dc7c265dbc34665420bdbbf6b510b83c643dd407044397c9ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b93434654e74b2fd92d44974d23797d82b5be89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c4d85fe299dbb00a7ee23fe5c743c1da701a0a2cdcf795d48e2edce384115d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c06ab4bc6db7b811d907a8e56ed30b3b58889a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f9190fa1d2ffcca1d2b514071a4a78b23e570b63cb6c2a803e28ced1401fbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65e6187c4bbd10006328e296b3fdab1474acf568 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697a361a0768c9318701959f890b24baf387bf2ef3c69ebf89ad46b875c926fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..176481b0c8996bcb93d2e4a4e5f2daa0dee828f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fee9f34964ee0659c7b49be68fe63b2da3297f9a8ed33dec4cd7199f15337c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..872da767dab93c8f96361af2d05bbad6690282d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c746ba13bf992163a098783ad157fa4efba86217d87ffb6a2c1b0f4889c64b95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce508a310cc280be024362205855f44975d2e81 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5ddb39f740bd1da546f5761b01c41e9f7fe927eeaa1ee5c0c3deeabaadee1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a303e6ca128a11f2139532be19daca8475c465 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf4853390c92426b2245017c74b5fa3604212827f7e8ea24d6a05c8da003558 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fb997abdd0825a9ed47f2a718806ac9b7b71515 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a648188f229f569fa949ab7f6738b3293b059c893046aed6ced442d4c509b22 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a5f8a4fb49c07a4e64aacbfa409598d45fb1dbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb21fd7bfb6cf8d6a69dc56d393cd292675601e580a825e0d839fa6f72b4ea84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd21050c6c3b4ed1e2404916175cedf7fe6963d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc2764c00b1c5ff3d247ef2851ab592624910637d70f15140d677d633a5d42c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b055324b93a381ec0288b277382fa77418043dc5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73cbe96171b5951e51575d6d79f2e5c09b237b80a51413cdb50f6aac143bc0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25796940c30778dc0b7b6e02b0903ca1bd86307 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4cfb940857276f03786cc541ee8cde42731559503642d62ab3a1e656163942 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7440948df67ea9ea4d1e119e66b2daba8bc2b65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04a75075b9e57abc58f89a54ee3fc906fb14f857925eddc2ac4dcd5283678dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae2cfc42b97c677d40d7c4d49e72dc03308a600 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc1f4143144cea3099e2f00c8ed90193df39ef2d7a6e5e1c2af9d6ebd5f7b0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..848f6673278efe6c65fa88291b4cb8ce5be72ac7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c53679516d3ebbc4c57a445432b83c7fa0deb1151601a7633f32f6429cda62 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b956bef47f184d7922c7d94cfd17b5d90593104 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbaf4222fa0461b73fa844ec6d168848c2f6077a046ccffcea5dc478cd1e93d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a2e9f926f1728845b3167b15d8e76bed93bcdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0611dca62211e9e8a177357861f587edad74e526e2e71beba1bd1a8ceea0ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eca0e46402251fa8129a12bbd3a4c33eaf3845a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1629c199ed97407e4e25706dd5a01baf0e6ec6a1556c1000a2f197beab3ce810 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5116b65ecd7078fc0dff7a6efd8499bd04dc0d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a353ac283795e726ef65ead73f5cd1ff242a0ffb26c00ac84dac8cac88415c97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c3e390982d2bc55c4361cdf75bc3f970fe400a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c769d93ae64ab356d6eccacd133d99e98bc213ad0df819360e944f2beae939d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..daf966d5806fef8f7dc7c5f6b0791eeeb39d5031 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57a21b3903ef1bbe92e71428461ff5fa24938d8989d441391679eb75ee840f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e6560e05aaa6dca6a11e2ac3e05745a5804bca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68876415fc91c43f2ee035d2aee8ee6d6bf9acfc99728d76c04b7b176aa2667 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d724c633ab35eb4bfab62cd6cc3248d44b3501b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25451963017a06080512b8eb5f28496e39198c8318b161c926994e26c56a5003 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf223c4914331a1fd8e702fabb76d860c396585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c362743963d0bef1bc3cfb3c1d92430828f58bafe58eb501e0abf6be03e281a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3c455d74d4f0e1f2770cebc7217f6e26d66c47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21642a2f4c4e905b1192d2bce8423e0bcca8a477d580c8f4463feac714e2617b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed77b190ba828ac4bcebe5bb09063cfc7710b53c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28625842cd83d7588eccfc11dacc7fea7b2b4893ecb5b866724b0d706a6bc96e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba849ead15704685d9d6991fcf248426f9281647 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d9f67268ea4dcb50e497a4e49c5c1213b4e9ffceb7b5ac2e15ae0caff18592 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae2dda0cc6d426562c5915399f3778153438aab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7436ac0548bb8d27e3634135e0a4a5dec6cd7b3d57499ffe9f1399f5778924 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc95e5e39e6ce7ba20e4755862faa9d1a552c93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de81b02dddfa41afac288f6946573ddd9af0392aa4bdf1fe14ec3d62be2a04b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed5462a57d6168a4bbe097fb9639ff3185a6020 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bdf539cc9e51bbcb56fd997140e8fa91b2e24785ecf449f7c374e395c17d4a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4169616a7dd50712503239639aca0048261fe9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1591bbf20fe20e104d3de6c128fc5a24b2c8781c41e9d69de25010df74d3563b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5539e08961890eeeef9b82a3c107da6fc104a91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f188dd34acf74a39733c789763caa7f55218df34929867f1255e9ee9e17e1f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f3a7e9756ff723d2f80513d2339ef79f1b225d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071baca15be819431e252eeff1b0226a083d9efbfb6171c8b22c25356de4037e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29863f22f7deb92cbf28a933840a5fedb486d463 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c447ae12331c084d2e91cfe7be2e5a95e5bb566e710ed4c77d0dd24c252ca45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..563564a80b7ca13495796d4e46365318350be171 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cbc0b365440476968587ab92aab84ba74bcafb2022bbc1ce8dd32aef995d27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10514b49a93a5efa808928c7fd10a8c1c29a345c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635592ad0e0635c5e45754730996f062b8400a5d134c266fb66d9cf71f1c21a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca01dce178418320e4a458a2827413ad5bc1c13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d50557831e899a04fff4fb2e37c1a642fc0d86873ba156f041ee2a689c8dd5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e32d21215c3eb95521a05fa5eb84a61c4ab47f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984ffce833515502667c3af2869b4a5aefc83530845c11cd50d37e24274cab9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0347c65d1bdaccbe20fe5fc48a110cdab555e36e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7801b319a9bc1437a33e890709aab81f5a3ffd774403c355591e0b87b75ec92d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0790505632cf21ad2865ec75d90fb64069e1f73b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6279f3a20d1b483de59b0b46875822feb9c5f7a8ca59b19c4e1a94226dfc39a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6001abda2bfc717d57acf5dc4d14c9ed2b23eba0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a3fbf9681ab67c5bba8e377ccedda085a6a78d36af74c97ce52a4f2245a28d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7e0d26e1c112cde81cbd6f7de1dbc8ebc6f1a63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d89672e33c2d54eda4a15b89cc870e3d37ead2f89c64fb86ece2de95cf5758 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6158ab312cb53029230dcd29806d6487d47ef2c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8fbe387ea90cf8394dab4c737e9a9cfb275bbf99ca9fa4d0b2850d998b1913f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4291a1029b1bfcc198d5307e42814fb383d9906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3165de6ab5ef7d1f70c1b2d96a811a8de5bd9b84947889b06169a1ae8dae2b99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed494f2f4fe24d6694a39ba960aeab831471944 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49b5dbfe271cae34763d85b75a83a3bad5a1d28de822cb0b43759b308d58420 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c902abf25efcac6a92bc2b73cf96e3238a043f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73eedef00b9812fe5efd6f3d8f4454b53333826a72a6bedbfc2c88d5f3c4d599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..512da738bba78ca586898d0727cddaad7475daaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4685469d19377115e940ce187585556b03b9a3c02adccdd346a39199288d05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da895b7c6b38d5f19e5eabdcf461f463e1aa7eb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2693e730680dc78cc82a27a59a3c1579b0519cbea4deea7452a328662c266e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31a1c95296af4dfb8f37c64ac6d71e3782a0d903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc3d5c3f7e9fae26a82a76c37e73a0b1a129378b29daadfb7907ce1ae01732f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e66c54bae097e0e579a67675e7948d2c6e3a3840 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab46acc7b11960fb5b72dcd801ddbe59ee1c172cd46bd73f5872390438c86dc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..779f33e85547345362321e9eb86f60b4ac14bfbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409cf10f6210b1cca653a6bcc48b40825527c53e356d06d4b0248b71f39794bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..255ca3c951e25678cdd0d09efe3996f189de2761 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc64e62bef9d8fc6848de7a8e1718121b8509a56eed645edfb79620627ac49b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ccc34a3dd7929f214fde7f71a53ab05cf66d993 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12607dee627b7ceb61914526fe21d4473be89f1a1c4f465d8f6363f18ad45107 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e599432667fcd7060df49e59d5e7329beca2c16c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c23b6302e7ac301e02362d55a08d333a897c9f9a0f88ac674bf20dfd0c0ecb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd34095a260894f7f715ebfc8f988a26ea80a51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0d555f4db65006c240ef5e28aae8e1437c2f48ecbc53870927d5d96f443741 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81f6e2c28b59a4f6b9b14aeed86d4844f09d5ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3b8c08d490be531eb31c1e8f01158940c22e8ccf65d7e33d73e91975bc7c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..304d13c9dec0e7e8482dc83c0ff4d8c017f56d38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cba9b96c188964e75a4b7fa64d6df1a6fe70824c695c02b2a2c031c81df2ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc44d82626412f4f3373a2f7e93c1101ddfc904 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4536da5fa48dce4ebdf61b7587fd02e759f3ba693abca5c4553cb273fa49089 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..423d56f3d7ca334493f18e2b0e10bcf66071ba6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8fe460b3ac1299f5613bd6c06d27df207b4a0eebdcadd617528b9a9b832dd83 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..beea00ad66a9997a4786f64acdc41065b62e7cc2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781c672e549b2114ef41c05659219df9f6ccbae957f3a76271a0a7713e6f7c78 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2de39c7b97cd37e1cb09b1b8c1ce1322f85425c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84ede4354774a34e5ef25fb2203c43fd18ca3ec67ecc9def741a2ba44395b92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b014a83d3ee111685ce5c282d30bb34214ad765 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815f532c8fc2348a36b83922d33c8217380fd82c0ab7e97356c73f6da5a86933 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f342270c342e69a052d1f2c6911c53a58dc40c7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb4bbef54f36aa888397731ff8d7f2c2048b70de234ed632319e44d8a619cd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b407f61f99ccfd25e21f6551288cc0cc84cfd1fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caaf578791573b0dd872f5be70957b7314ef8afbb320f7a86f6085f78840af52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0228c6e1abde0fdfa6354f514b9e0b06a87a23cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32f4293479a308bcda8507b0a5d740dc18b57b49454c126cd325d0a0b2e2b354 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a108606f07c0286958354e51bc823ab1d05f99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236d5739c54f7387b5557d61e172c8b9f10169c37e4706f9ef3435c03f050cb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ef8665cc2eaf712ecd185b8b6501a6b3a7292a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94dc69fc0dba53622e5c9c52fceb00c4a0f8c46b8bc77ce6a37defb6a152e72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4f75935de3e1d4fc0d4f69630e8151817a82be7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d46dfc66af242e401992bad77557c0513e3e6edfc06ac2d4370a0129114f7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fdb2d87b1f749636ef66092f26514c587e980d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400a8cf33db8b44f9b25cc425290a73c6e3b9240c1617219188d902526020d51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d24cf4fd6fcbb0b99779d3633d63ceb8806674 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dbce45c9d9ccdb7eb76a210949383a4d878ab03ced9527bbe266bdee4efaa81 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3309c8659a2fd500d7983ce1fb92d27227eaadf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4613696b8795d4db75a8b97ff7d9b588fb25d24ade98ae482f76c88200748a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2304af0f9a8b0b968efeaf6151752e2fb143681f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4644a7cccb82f552e2aff7706613995a02a9a22a6056c0cc78d5fd894bf435f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffa755be5d48d62a04d9ac8742b99f6dbb971276 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c16785074c35cc4121e28ee7f1fa7dadf3561cf56abe79b060b7ce039b22a02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05c26d5361e5886b359b783f5ea3e291e5f0ef68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315b1b4adb0631eea7dc823182aeffa1b9b5363092eaedc4933592c0d637b984 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d48d61a8f61ab04dd0dadf4c314c1f8498e713a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296e811ae83ea4e7f9d46bc3fd8845c7367fd499b094fb813805b1118b384891 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fca1fcf09173b3295a858bb8510012e6d0dec02d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a747ae46bdbcf1bee12a5291ce6354fda49e993c98a8c18115f1ee398b5b5288 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b290e8ca06840957424e6b1bd3afd46a6b0e38c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd50666cf5370a8e88af40a0dfe0172dc69cbfab86fb08625c0b75ceec45955 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44676d33804b203eef63637d87790e05c1e4ad37 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db8a145ed914df4ebe34e17e31207000756ec7f25a466126a4d88609e96a5be1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff11819beab237c4ba7d496ea71d3e9dc1f6473 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff5d6cb461fabf4a5d7d6016c9f6bae120ff54a8e4d6ce4fa47a3168453a327 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d910048962efa6cc20ec79d363c30090d645351 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e190aa20d15c85fd6b7ade2141c3e99b176ff7669860889e41a763f88d4f0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5315ee0a1d2971ad2f3b691c4c8a6b817671f4ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96191e81bf2a734bb1a1c65a43ea87240ff74d8a4b883c34196496703ab4a18 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c46be18be26c3e0ddddd3f131a5c9c12647962f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bd3850d6adace044f1ede3a38276a79aba7294f2299f82b507e4ab093dfcf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ba625cd46914f45741c9ca9af9b2a0b332305ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12891cc6e13991ff7cf45254bf974c72554adbaea6e07061ba0ce43c0c0f4edd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01248c67a9c0aaf93d09db68dc87dea9ae805107 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42462b8454700025ff30af5fe682047f167b3b0cf9ab1b117865e4a42caecb80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc428fcefdf8075c76d87f81a6fc12dfc6acc98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0680a77398c206277a861952d8add4937f6faadf6a53c8e1bdca3891226db4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7923ba427bdb0b682ee8d944004a3a1788c49c67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d785fedab77f9b582a0a52ceb87f04feb4d420366ab4996d4b8e7e2434c43ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0de0f751052b3adc9128d4a4ec633be82cb9fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02c15cb68f0ae800e33e48fd5f4157c3df03357ce3473534fe90ebc9663a850 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d2e77a007054f9fbb3bb1a582cee066c7a5646 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54ffbb785574b1867212fc8f8f549643310055fd1561a9cc1e606b1649ced14 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2aea84edc4ac54fa8e32ee5ed82be8b668813f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034bfec531483bb1043fcda971cc7329b07231ff1b9d715a87f2c98b167f4ac2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7bb318ee30a04462c681c27244a71ce35b5e19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557d20592c617e72fece488dda77ec37f2d1625e205322542e670f88c51a0d79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ed4a0d5008201c397aca7ad11bf9be2c1526c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12bf31dcb0380411b116f2e6ecfc87f13f36ee94501237e60e4484f4afaf4ac1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f0f04a9cbbbfef24dc0107c9a6d047644aa1f42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62cc401ec2cbee17e19179c81dc049536794169f067100e7b3fa8f1b786b1fa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63aa71d3cbb057b687bf36893c33f89ba6985350 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c765f1b33ed666251b208e15d8322f38dd27a0814080ba4a0b5a4341f6d6a74b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52f9402c06a986164a0ae8f12e40457f63a72a52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e154be222a081e9b85ea87448dd0028d7efa7602892325bcd5bba534874cbc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8893de5617f3265e23177d479a9d4552c1dd26e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f01d6b7e8fde221513c8d29e155dd31c91b73b2253914d3a6c70793628a0d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf694467cddd0599a2b014221ae4f47273dfa5e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762c04a422bf5b51e6b16fbebb25affeb6dd212ae25a068799cb5d3b969e4ad5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90cba7466ea08b04ef6b5b1c6f83986d11425709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3e605c91ab6dd7058cbd471f37f4563083650b6fac70fbdc3ad8cfd29ad75a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a8568fabefe16d055c938d2181fe0c4f08335eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f516e4d6a9b2da7b40b0266bdef0df190d9f7cbf42a880e94e636fc2912a25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ac973ac5ff906485b3f6901f622dcc72128448a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88b657b4b8d5be390c029ac45ba982132ceff67ce4601840cbb797f1d84bfc33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b636d1f53fabdbb7ce9aaa2873810568bf039ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9afa215774fde57e64ee7ee35bd7c5350bfdd7f0facda3fc2784ad8a636716b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..375d394e6ca00ef63e5fb38865e83d1c581f8b60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b2c0c51233763b6337b89096b4abf7e87da7b88c0be8839291cd39d4acb42c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b308c96e8e16d77cff2c6878bad8184f7bebfe7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b00908d14f8c382d5056b8dc0677a07772554149521ee91dcdd2045442866ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aa91591c4cdd55a8ec757bb1a13e9af0525a637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74baf0dabe1ceaf87eb378d24f83add62ddf9121ab6d59d5cfefcf57d51ab7d6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..609aec176c1f47b9d8bb2b5201d32f8ff4bd5268 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c0ede400f01c4ffd640ea7b166b4d6a46360870927de94841adc8ec44d269b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aac4a158c0cea686043e60808de2a18676cce53c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e674aa4d36948c4a10b495d2e21a448d1811a220ecafa3ad38824f44b053ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16616f90dbc7b8ba9e08872455e6308e07c7602b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23c188210b962b104b512ec021ee9194b05467031a33efa7e0d39893041582a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d6538a3019b93d0427b852dd40bf0a4b4389637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3b102c74396469bc865cdd81420afb60b2a3636613c7f52e98f871f5d9f24e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b71734b2fe1396d0f84abdcec99e70d546c0126 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5fb2b94dc9a2b158621e1949ad0c3e60bf585bce1e4b32812d2713bc9ddb661 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bee0002fa5f2c84555a45022c763e5ed447e636 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f53c3ddfbdc4bf4795586393e6dad0bef04e420c4b904743e0bbd26ccc85852 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70855d897e25dfd8128acb9ac173286a48fd0b16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e79f0f8f128a99341f9c003cde537ffd8b7c329e4bf13979cf12c2022250838 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a253b8a7b011b2585600a8991e97276e01055669 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d91c39aeccada195523c4cc8f5d7365dbaab09e31ff354be721bbc31e9354c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1c3e72488514881096e313f9bec0e8f964b8bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f21a2ec76a0d2117e69a754273bb3960ac2ca0acabc2de40d77bfc12031a55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65f4cbf04af0292c0cb3baba0182d77875b2879 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af19476952ccdcf6874cdbcc51ec3438d158f36870c5c25ad7e6cdfcc34cae2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d57730ad4bfa630ca5b05eb240022477c7e0945 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7d3c2d7fe52afe22c99b68db364b7abe8534598781fd57306c33f24bcf4c87 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53d61cd7bf382ab46b3c22520d5201b94906a24f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df68ee9540ff87eb55bf87ded4d31a5ad020dd6648cf3e3a0d1e2d135010fcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8863a88d5bf7368027db3cb8f73c58a4847a56a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e551e7cb457c91cd19b59abd3e71be773d650a896ba7d116e4ae46feaf81db0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb531cec6269f9b0dc0835d0e2a6747bcf68f3e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486fd04c7e4e4752eb16ed2eb3e5b229bf74551e293cce0e579edb2b6e2e5db8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6e545801396b582fbc62c926ba506dbb76d0f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8eccf0f408288ba7cff9b6a1a23198d5ccd89792cb72ee5c692129f2f3bdf6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11986e54a90cab5106474f37f1ca833bd5843699 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e877fcc201d28fc0bd33a51d11caa750c4b9304540bace42e46c77a139ade40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01a88e16ed3ea9e7873ed4b1eaef0c96e55c6a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6bf8310a95be588704202429c5940d2826713ee0493fd8322dc918900702ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c81ad9d021ffd67f5f0914a8f2950f48231dd27e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c66cd5208242a03f3e894c7045ce880d32421920b0a17b32a47b111dbe1146 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..342e7a42b88a567439283370fb436ce5ea4159b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad40921871e0722289e3babbb141ddb0f399a15b708a42a5a1cc2562a53d167 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbb1d97e40264d39ccf1bbdba4ce7e4ab19b9a12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3716edaf75cbe9deb5f022c1383c1ca674b14c07a65ceea07ea7f88b9a9c73ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a92dc4042d808f1a9591a0b569fe692348502622 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8b7c97166f80546d9dc9e3e9c0900aa99e105fc9cd0c171531194ae271053d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..952eb90681f1b5a622ed775f0c6fc7d7a1aaad77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f915bb469a3e141de07f43023e5c368028baab593aaa8d4100dedce5c9955d73 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7c097dc317512bfbd5ab7e9d82c67b6195796d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd757e361f914edddf85f8c509b966652396ddbb17a5b9fc46f364f7a62320a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4548af3579588c25e1d010cef6631db3efba8d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b023494f3af4f23523f81ad857907a4149551b2e39215fb1110fd264dbb7ac94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd24735803842062cd68dd00730f1583b0d8ef9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28153010b8e3e34df75a24ec2fe6e0abd2b0adc0718d8199eb99ab1b55cbedb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb66f4edb13d6a7f804cd95efd52b5c4abbd8fb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe736f8fdc19f3e6b6f8afc642bf1abb4b3870bd59cd8813c53284dab6bc8b9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9d043eeb3a4ec04eefef4f03df3ddc0b9bc4217 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c78338ffe77573844c4f799a147e6accc4e1e2a957f36d81c79c62dbacdeca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e452f4ee4667805483dfcea644bd82473edd32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc6b70428f154eac73ba5e37872e27e12a9a4a60b0e6a9c499e67e76fb8a561 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20595981a2582c0dd3681e40c9354361f081d013 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc27ed3dd874f01e47da4816c058f72b03257e9b4b8f0f91178c1e394dd25cd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d82c01e1c73297aa65881ed844ee9503424b29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2f88a0325151bd4a194c2814dcdb9c9c28df0860e5193bc2442fa7f7336514 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf0a7f0f16cb4700ffa3c01b21ec9a42fb98b4db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abefeb5f46beecb8abf96d6ea4795640b28c9ab2bcf4ab3bb009b908e012d175 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..455010f58016d6c64af5d59f4ce798029a9531c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c0773cd57c3b862c2011d45875d6ed63aaeec42661d0d112b43898d5cf5e4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92fb3774ef5d72a4e2bd5356495f6dc3a3d231a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32c302d4c3336a8c47498676e9923b4ff5d746f0b50fb8b398d91c919677057b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..777715cd6f04be486db7efecf5ca9bc4d44cf4ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501eb0898321d755fa4434f0a199968fd9b20135bbefcf64caac8d3bac20c604 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3a70906dd44f46957bd7b94d6fbe3f7a3f12bed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fce6f600fb1690a5072ca52fa485fdb6c4bbfe0f50e92e68d92bda184571ade +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52da60b1e251c75bd60527722e93ec679f5aac56 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2cc9ec4a871421dedbe67e1b8236463c2aa779571646015dd2184c21ef491b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8116f8b264ebe9efcbf43e46f604cdf3cfceed63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a8e6498d6e8e969854debf100ea3e0778b57ca697f02b1b844d5fb191b30a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c79efa98df8fd181d01334e0d05af65f7b3d27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f604b186f13d47cb1877c12a37f9c5f9ceb5f3d73aa7aa40d97cc906fdbd50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a75870e6f24b507e40adf709d44838ad81d53d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cc90cef35455a1520b38685e894025f05f95ce6444222ef1f24265fcc80721b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d96fc21cfc8af4c565482e426da6ae4df60f80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc2c62ee69b52cc7e4a3709623d0591fe4f3e53a036177161e18c43525e9229 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb7ffb6503f366d39c0b4a7d1c65bacce80d5e5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbd551f011527ea2a9662e35400f82e7c30878dfe47da0364affdea0ab8bde3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff76742fd3ee83dab7ffb751ebb99ab66568048a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2df30d7ef07c12aea2cc1c12bde0e922e6b5273023332547bda837a2a6a0e7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be3b80ef559cc947eb799518aabed7bf8caf2b99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1e9ab0e4a729ea9a7e0a0e6c8be892b0a4b007f29193ccf4061a7d6a6a4a77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f208135249737db5da606170a20783b4cda4235 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:645047f57abac43d8d993e1e1a2df86ba20a4a220024a11be907b15cd670b7ab +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a950fcca9cf6c1fe88a0eeea863b25b46646a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db23207cff4bf477a81907f1bfa4cd4f8df1cf994a7ae0e64cbd2ed56f8afc9c +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcfb6d81df9036b4a96fe82087ada4e233f7ce00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b62a63cedaff9608d58588a95f32b24acaa897d3c43f814bb1973ca4c8e397 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6519c9b145608fb00f99819ecbf1f2863dbdc98a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5443665d629b6c5fae9efdb678f52b131b5c3ee13fb0976b176d1eb6a59471d2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fe0ba1ccc9e955bb43611fd9f449c1cf3c63b46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab456d5bc6581e818bc7fb09825f70a4f334c3f299da1554d0bc312757294f2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c57c36fbb014c99d1b1c3b2f167643e25521cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:204a8a7e0d4171703f25151eb6e3991fb1a08d6fc177917312f6dc3532a2ac41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7584d9921a2ad00d2b77746cb91f0dbbf94f2434 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c3a59469eeb3b84ba20fd2e28792f69b07f4aa8bcfc38c50701071c6bbc083 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b21c494a4ffdf86e5dfcbed63239dada42b5a4c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:674040842b34657b930d5bf3353884d56d1beb0de09e0602ab4a16e474cf53cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e7d8247a135c64ed6429a350a784db7f1e8ed9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a79d8be40d25258ce59d2e798163b74cca2de3d15f4f96d0e4a28170ecdffe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6844fca4e9b408d79d2145778349f3dc232ae5cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a4112e846429c2d494f96998517f7c7b811f643059b1a9a293acf174772282 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a5d63e02216e5f4eb8c0f3e96884f84b1bd14cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d649e0a85ec9227bfce8e07196794fa618c54c4cdc8fa56b70d247ddfa344f4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be99d1820a8b606d30d005b173b2ae5cc8bb0130 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b11e5ca29818c8b64fc3f7526e7232604aaa408370f2a8ac0c75eba654a97c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6607456a42e14f86510dda4e2929773756e027aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6fd39bb09c0dec82505d75eebf6f6e38cbff2c745c4355c042c0466d738c31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..180fa2a81c34e326d0141c53607732169268acf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e453c63155e3272a8d8167bf4f6d6b77d4a2735c935dca94b66675d4d3e9c969 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a8b70219da7b0b7683fd4373b68870067cf5ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48daac45fb0d1413a98258d2c23767df072899ca439dd8675eb9dfdf0c88dd3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..286a0674ab901c9c3849cd2a2d54892fc1426aaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d8d05ad43bb8f7ec0c17dcf87ccfe0defd91973d371807fc8de3a9a5fef448 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6290def28f8bc7ae4b9dba5be67842a9700e7080 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897d1082a8695bfad407478c5858bb5b1f91de5d048d28ae04926e3cd0f0c992 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31236d59436ec7d7b80e03d63410b333d89f6df3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea751aa55aeb91fdbddb3dcd160eab1b20eba5e0d79b25df71aa4b5b81ac03f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a103d69972785a0a4f3455f7c7b7d8ac038263f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b01c8f9a379878f44889d4b9e981149e2e4450904e0c45ce52199eaa73b296 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc3415645d6e97e3a826e4ab41fc145b1d23796 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a806ba6455b04bd935275e5c40fb69eb3a8d29411d302ce9487bd8476f705e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..865218b8bae38656cc45222fb147e4f32ba2b963 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c341e65440d50c70219e03c365612aeb2cd07850bb070ab94722af8156100f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab57d56c7aceb23adcc609112d5b30bd61e3e32f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8c25750aa1fd506ed3625f049ef6fecbc8e34ef10793ae6752706406beb9ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3313407e322edca0c67a126f49dac793529f0669 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087e876d52012a40d35bcb3b61d8f0d9279ef2f39d14dac88103445dffa7e4c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7961aef4a485c46b206333ff79ca16abba85d69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ec730863190d8c42fbf19a1fc2c4d897fc06dc756afe08c43d9ea3e3ffce7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a4a84ae3e43df15d120786cb54937c59c8ac9fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba26a1c0b8ad8a02cd42db09445743a1954baccf61d691b5291c90de50a787f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72dffc0bd1d1e9d6b5d8ca8c863009e6a0206e92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145f095d33b1522a33a4b223df38cc97ca18ca2b30b56f798a06507a7e24d6ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cee1d69b41e204eb95b562e5ef95146f59ffed3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5df3fc0477626c41d065f79df12487d9361dd32a20c1870097750151f27de4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0360bfd1e5b9c1d63d314e26fa3d4289472836d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44959376d19fd840e719a0b904cd375c6b1568d6500902f51a9253136cef7445 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d5fb3d084d37f2be1ab34169cb66ddbf974f92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d23a5f7493ae8bb670042c7106ebf316d1e6cca8cbfd5df1091a09fad67153 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc7ed2406a4d39158ac05a8a44f6a014019054b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abb163e491095630355add4e59a96d0c75edba151c12ee45a14facadc8d4a01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1149dec0421a068d2530ba718b85db7917be9f9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f7d695158d2843305cd4c7ec645069569036291bee0109bba4e9b27ad06215 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c0f56c031a543068dd414096133d2f2a275003 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9aaebe6e14fa34e1a11989df20ae32945e31333d8cd525c10f7478047e30906 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c133464d61f1a653edfa08234f2525718d8091 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9adf110f25eed3b8875d127fc26cef758658fedb5d82262fff034c738cfd3cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a42cdfc9857b62de81569daaf0f19db1d2a852 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949f37cd3b7aa6a630e8034e430407a16301451b6c280a39f8ee4d68c6f3b6b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d531fde0c6ffc365fa60b60694574ef2ad21bdd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cc3c6f821158b00c733edda0569b777517eba8120eabf31eaf892f8a15fabb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..971916a000238afded6bc5d31ec7d6a5321f0eec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb079728bd1099bac295ef361321b9d57809c2e82029accb7116b192e34dba3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48637f888dbe93a2a9cf5c120039c9af85a06ae7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c80f083d2c93cabaf2dbb24cfca36cf35f90bede70ac9a2a539d591476680ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61bd6b8af107e76e5c77d3e4201c56d1c5cfe5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3924aa233536477208af4efa84a592d0b63baf44a38f4db817e406d92d66030 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b12c0eade27c1ae7e22bfd267e780d0c91f18ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee30ca2dae6c6b6ac7aae33ed177538d05940c9c72a91df6a82c70133c81cd75 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..524a6fd1c2fbdfa13d704084884d55d52c9fa6b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce250a6659315ff70ad8bbbd53b2c1a7c48946122991d7b74a6d058d0b0c39ad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f410e31728df473a923a8541d1c75f4b25f4418 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccdd724a1113abc65ccad67c8826b5dbcac6f8024918bd52c2d1b96ddedd6c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ef0a35bd66dd39c1e878030616cb3ce4ca0dac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f9c0c1baea1d2f7245f41ba37d0dc412491f0b1dab07486f73d7f7ecc0c94b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d80af5510dd879eee2d005d4c3734b1c5c680b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a5a47133c2ecd030f5f437a5fec88f517396ee53c5a36e0bf8c501e60304fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..610d7a6c911c9dd3419f76293a38c46302350811 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e435c33a8a23ca7029f5872f296991d48a360052512363f7744b7647c50dc7c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ecc50b6c1859f126b3bcd679d87a684a77f348 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb04daa838b47a374828c4afd6aa6fa301a5864e1cbbc39cce81e70402d4fd9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f473a8994190dd11d6fe208157b3c4fdcc0036d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2500952b9df210b6ea366324d5a7e3cd64c7db08ab50ac75506c9b9f34fada1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8fc838874298fc87c12219dd79f6c55e185af4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09db76002b66968a57d560d5ce83999f365da7fd115262febc198cb00472d0b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc41c122987591f5e62817c2d53da7f510eaa11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e05f6d7a93d949c4ebdbda415f891a8f680d61acadff5465544b576009c49cba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c2a1e9eaacc8059b497959ab71ffb3202795cbb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e0982bc6bf953e11bce306aa9eb2b086ef21341f3a825ce57db834da2e36dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f7d5270648851c954ad738a6825833e66c8f3d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ca0b677b2b7f0ed2d5118d57e9cde52188e847c5b013cfea075151cf764ea6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da9aeb516491e38e592f7b525f7a07dba0252dbb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3782a4b48139597870b5cc62a0c38a1b7d72715c106d3dd1feb5948c56fc90 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0596df4ce2a4c0d62bf736a9027bbb5206de515 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1d486b8ecf4650b2126d77a8b908b73416df1894b39f78c2886e89afc1fe80e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a698f00dd210ae6a743ef2734549460cd2fb42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2cf58f280fd132885badadaf6ce8e55a4e47d422b7d8d43b20c2a3e56b59ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..125bba060c981a4a52dde5ad8f90512d6cf77ec7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be5b4eded29f9c42e142f047f29807bc5e26d128c9394a10a70ece827d822e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da205d695f78fe839174a51c3ad3147ca0196c53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7e839d2fbb34c0fcda1e90a513b05e7e62d2f785d179ed6717af96d99334f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c740ea58c1a7ac107332a959310f63d40cd49d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82897e2012a1360c2075510eff3b1ff302b2de70d8d4ded4a11e42fff231849 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefeb40fda5648be1005d52ab19cb691bcdb5833 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b3f138a04e082ee647e88c80a0cff2081efc4c758b80b2e8d0a3ead235c080 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c89aaa0fa093be5c6d26adf44eb0d61d72b6f93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed84b8c08ba45f6da487d513b2da7cea2d0f9c4a0c17fad0de3b59d9a1a6ae03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31bbf92e5e63e0d1418fc5b7dd1b90d734740baf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cae801c161bc841e61a44a6e026a7e40dd9264e547250f5f6aa451e0cb95ce6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c91415c476c49dbafa3ec700d489b2f64eea994e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8876d00d020c0c0172f688b539198b0e83a716698d3b8e7e32ee5f97e497267 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d7e20b42ec07725cf8d44ba76c84066e48fc28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0086a7b5428e807ad42e7bb42d456ac8e3a66a123aecd72e7c165c971dfe06e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b0576c24f4feefa9dd74ff5472ef4819c5fa75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8950658df46ac506f037ef01f56b651e981a5b9d1ed1dccdae98022f34349919 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f2949cfa1b8f8a170f56b7ef091325317b2f04b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5574f657f81cadeec5105011f5c0b5aa2186ec6ee56ce1c252d23ccde22f77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c5abf91a8bd2a62bb42dbdffb81fa641f9013b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5473b5a32dbcdd5de54b4f64e044af33db99150fcfe5075cb0ae6cbda1f37d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e66f2aaf0ceed8dd0ea9fb5059f20390c9737c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b53630931d1d929a3c58e9fbcd8608daa613c95140b55263e0d2dd7db37281 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ea8ac34cf1c24cce4c108738707490f53d9c7c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e5359ad25778e6cc5da6d713e48f4840a751ef280fb5cf2af2deaf0801fbf9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eee4bbe7c4a9f20cddeb2b9199b8ebbf3aa31c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f08d9bb09fb9025c30a24202feec1eb46210bdbeb28dba78bb1bd9c22340ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5985dcc5cc912e161432f38328e6628f132561cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29781bd531da03e590bfdc458ad869502f5fdb69b5920e67d5af57940a4d3626 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81e5dfabfc9bd00a74f5cc0e7abb87a6868c96b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a38d31db8b9b529c10282ca53512a6cf0c7023e86a283073859015908a4af3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c0432b4c1da41df5aad63ef65bb2dac4d03508b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42f008825b0d9a87a25cb0396c8a26cea221a99efdbaa35b6c25b6283421842 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a4d92933100f351651e169942d0fed8e1c0451 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d743e2e6610a3466ace08a68390ca6a3367bf595ef74d3ad03d9968dc0e9d46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d03e769a38db62e9ee3cdf200907c9d381bce1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d7aa0aff9b6f6a9e29524d62265f781dd8f3e5825162e8c48baf21de823e33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86cbf9903ef7e61d5d1e6b0da068527b01d43e52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ea328412118fcab570cbf8bf03473647c3b770fa8322d9c95ae84749cbd76c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb8cfc1087fa0554c19ddfe22acb8b0e402cefa6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a161f2d32d4c60fe93f86734068a52367bfa70f1a72285881f8370f712c56908 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03fcbcfb7f31c9bfbae62678e565fa1dac59022b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36826e259eff83d2a89a25e9c2e70ce387a4ba19b23825e5133f2df934791aba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f96582e560118479c6c9f03d4b31db53410901e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948a0bb4a24e1fb89934759ed45650652009420caa2767516dcaec7539ca42cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8e3ce27ebfbcecf36b696b51ef15ebca7aef1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3182cd26ed2dcdfa24b37bb8519fb9ba273d5c6ded6f979d248da3bfaaddaa30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..086ff632548792a68ba23625452e048bcebbaa1a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323fbd6d16909390437efff97144a1cd1583e219e715ccddec6bc9a3d27dd418 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ebd47d6178363d888b1e485f415baeb8cbad6a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eaea378658f9de7a7010ae3024f567a0bb3f597e147e270371c1a6b63eb4c23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bd2c8f0376aa750cf21de634728a91f61448608 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cbbe5865e8c4f6ea6e973629d2987a5d45d806ec7986c584c9b19560df7f6e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02553dc1c14bea0ebe7e2264031f6b1c028d5d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775860d04488ae9c661da4cb9364945af7a3ed011f6e89cd6483a05ebadad785 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5715f6e62985a5c58b8911ee6afc6864b85b2272 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b862648b8fb9be2ea829176b37d054831effaef53f95582d363578fc3546418 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00cc23d9484a1518b7104ab811eaca77d35b9d90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6865b79c817f39f3b5b911c47a6d1a9e951f814c551f5d01fd20e2c6d4d3b194 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e9676ecc9534dfbb032fbc1548f0763504458c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1222286c466f2015776c9e2a983e620467f1bf3afe6c297a3233ffb249a1453b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..414c452ad332783a2c87f11ee23cd1cfa1f02ba0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43148be6c65fa76822e74f4cab9285e1fa9fc29ef591cd07db0f9c0c16d6ac3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..146e52d9cae06534544c0d7fcbe642782c44863a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c6ebe3873426698dde1fca93fb4e887cb574b1eebb201bef0e34f1d10d36531 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2092d513ea1126ced5b3e58b186d64b9126f43ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c23b1e20cdde4ea8ceaf34fde54ad13b6576c3b726b03a6e35739cef17cdef28 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd94deaf0d90ffed900a5b6d7a5d67c2330eb369 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d93a289fb820a3eb324a9f5a36c1af57963f905f114209de7177fa41d1fc4b50 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed11b95572ea1f380d385e247858c5407f3e1220 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6196f47244ed78d5f56a61d4b57486df7f21ddf40eeb8af99f4242679b2ae3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed49440d32c4558f0e155e80f4e7a70c68da7ac8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714852061887444fb9b40d1d89d04afb14328cf0ef3ad081b644ad49cbf98433 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7de17853fd473010938756536d2f8a0629aa0c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d036a6a01b19bb69fc7897e6f7c4bf65e91b55b56916f51e6d91dec873c2ed51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de82c4570353c4e7ef773e652af7e92ef7390a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2910267292cf8deb45322be0c31bbb349a5692efee8ada6315bdb5e0a32a5c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d860530299aa02266552ad9ae31442269dba4d1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd91ad0102e3995162d8844ef47dc082bb9b98ed396bfe2f8c41b8e08a7764fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7930777979648f70fabc122eb7b3f69ddd30f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a718e2bf5074f4841b3fb66cb10a646a7ee6c53f38ccc166b4492a24a7219337 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d744745fcdadecd151177502ff1c039f58f146b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654ced76a7432bd48aaa4d6cc0e2deb9e44f6e1afc5bf572a130fd6a264adf55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69efd169826e2129708e80c682caef72ed330fbe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6d31bab397ac271519d098143fc669cb7ddfda100bd001c402ffa032b81210 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82af2a3967ecc1ea8856e78d566b5ace38804333 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d593f39aae3d7068bee8d388793fd8c5937d07d4ae1a36439b9d71db1f968b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f6367e088f5ba4de9122c1b3760da02461f653 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054493aab260065825c7e9d6415b5687a73bc204f3d393af2319a12b25b82cea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c4aedeb9adc2717a2fa4b4fe922d69fcf88695 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87ebecf42b1b24c60ed6a743815af931f33862a683b3aa6385cb4628230bf5c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8bfd864f8dd3b6715e527bd683501a458b2eccd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b8c4263ccec65b9705eb301560e8d8263455ee79c63632fc22a8d0c99ea967 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3017e4eac605468764fd9fbb47392b54a0a2c867 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170fe9886051a4cc3dd733ffee0d19163566e007a2c34f0d1b56e0a9ab1e0acb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e874e137de49a67c8faaef29d5abd346c980e767 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5afe39571e59acbc871376c218c90596c5ee8d57b3940f7c3aa63079cd86a577 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a8ea3ff35cb8af502eb572c508ad2049b659689 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24d1d8ec92ce50806f6656fb3fa22d0cca0f5823b5f4edce10c36dffa8e0a74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c01fef653707091fe8366b96c66f7aece024f2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64644704206473b09a27a1d594543318ee2b50d33ebfdd60a73d210960892c49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ea5f377d1757711ff1cb2a8f4573af48809891 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e1d54cf8debf6e59f2df62b8a0bcf5294a72d3196a8b9fa642d828f25ab5ff2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b367f0978d35a21bcade1e5296daea4451f54a96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edfc687775c7f89a5259f2441b270a1a20247a1630ea41fd2fa22847603f945d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb80aceda2d82884d6405f02424e1937912e8fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c7ec4c4656f1e508df108f1f20673199374c6f707861fb65099491ac400245 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b060ecd3fa8b965ce953192f8eeae05c4d3f53a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69391af8661921c9b809b023bacebfbdaf978de628625225eb64874b64ead669 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b2a19597ecbc8e285b25e7c07293f772378735 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a681ea964e86a01783297b0f8428ccc570c343aa6253e959925dfe637538028f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f49a8664d89760c48e1f53371262944d81aceea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4033454770eecf3802d4277b0351e40ed7a6a32b050398faf0abf66e18ad727c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4655f0b35458920d724f71a58b0ccc4a09d57692 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ada914115726f1eabda20e3f94d9a8df3e01ca90c124d84aa81b3a7ac16585c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6831e9fc62b3fe877c45e9d5d8ec745efc2abb67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29901fb915f9d13a68b9c4f2882addd86a5296861cf1edc4966346d8c9d9e840 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d42b3be83e818f2f46a01a10f9fac2f298610709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4c863d2b05d419ecf88bdd2086679d98c20daff3cbc90e316bc1d3db650072 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30037a4ac5e813c93af8bb015ac598fd06fe7797 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e718c87be7dda9a2c550cf3cf562230f82ab1c0b23dbdf98fa9ec0a0cffa13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c98ac709fb36a96a21abc4e1ae745d2b8fd3cfbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd90f3d4e666fe10ee3ce87fd5181c8d390eb35c091bb274e3945e2876961e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a95cf69cc14995eeadc0afade603874a1644b4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94a7a52abd1bf68236da82df40b62e6191e0ffe0236f95b2ff197a3c44c2b2b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56dbe1557a9b035ae278d03626f6f470a630941f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80870be08979508ba63815c346c11288600a45c81b34cebd0a40e19da52ff7e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d25efa6977513bdb398b4438eace407c7c6b219 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e7c471c8cbc2423ae45d859d6f0976cecc0426f3e8ce1899802d026a030da8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45438d7054695cdcb24439109a2cf12445be8a54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cae3e18d3bb271882ef85a26671eb25b5b98d9c9477a359e2505cdd66d2f29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc96e4850cb7579fae9dc6140f08d68d2bb55cde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a332528120628913addec685ef6169c5c0d069ef832980944556af5bd0c66e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5774eac4b20a8c1e5c690313c1020c570d34193 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c74b582b9023c2b8acb5abd287af1a16a265edaf558e7ccddc38f9eb6404a5b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ab8d3d0bd7332bd6a7cbe9a0051417d158c19b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcbdba8e341000ba68cb7be4fded5cb04dc8c2746dca5784741ba5891c567f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d39f4a244b3dbfe34ea808b5a956d109fc38930 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ff31c3d46979104dbec34a79f2ee00a44f77d4beb5108110ee4df455db9f79 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e77b37a6ffa13740234a23ef408ee40c624e4ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42796325c72c3619a6363a65bfe1dca160d29d3b133a626fbe7a9b447318373d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c26079c1583c145f765e728ddb5e0ff7919294f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31aa42400282038ecfec16fa33b68b45962281f500914bf12953ecc78d6b6b7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9b4156be7913a7f87db9e34c82ad8bc161cd71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72a9a8d0825008daae23afa6c14dd92d4ddb764441ac2530d37d8581ff75881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd962b0004056b31eb83f1814aacf3f700f4abcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b1b5795b3035ec4bacb16140c88a332d4d3f75a321be5599e548ca3b5ecdc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11e6445732c497590ffe01a7e7bcc0042a873ddd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a0588e1e43eaed0e3a4b07dcad4370c74801502fb5cb7aeb8d24d05304352d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4d11a5e8020d7650ebec1c5c20f52092cb2563 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f592bb54f04c2b1bb84ebb700ae05b570e50182ac5908f935a67e7ff51859c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..368bc1da914be5387f291da9c78814f1f9d9200d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7e689a403d4936a673887fd89aca6644fdfae4c9556a54572771423f2ff33f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16dc12cefe13f9343d36425571db14426199e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f18432df5ea22397a80dc5f78465a1a5f8e62a06be24bec010978bbcae1e01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf36d65420cc093671262349c565d637ee364a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71104cdb82fab216181a4eb52336b59d495e8cec83f0fc0db6d0cc35887f5988 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b860974ad862ebafa74f48026822247e88df1f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd41ff5f7a5ba0f7e4b3220acace288afdc023ad9b88bbb6289ed522292e2818 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3e6c9253db342be177bd2d3da6bbc1d3efcaa1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b178cb782acb3e2d11bf6861533491b07d076c914471a75ea4dfa926ec26da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4ea678e428b75385a75201ad342d55c852f799 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:804a3bcafe3589ec512579db1a4f3bc941aca26e997f5ecc07ffec4c37f8ad02 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b29b4c463c74094abc8d644632ad3945a4796e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0fb0041e07414ee14a46429562939cfacad17cddae571d23c7911852c65dfaa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ce52c4ff8eb2051dd1cb0481b20092a4700629 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af25311853db5c0b7ad564e2c680288d827e499fac3933f298655057740efcbd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad5417c35d90625acb39de5bc90e1660dc26321 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:158499b4e671deb5f0f37890674d3bf076b8104b1e2b23c4e4433be200510079 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1bd63af101b6e6cb66013acef1f6a35ad6c928 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486b24aaf39fa98386c48874d4825ab4ca9669449921ddfc3bcea24aee96779a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8283c35a8e43606260ca79996de6480e4abe5fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbde1b4ef0f5dccc28d7668e69fbb6c4fed0b8d917b0706eb7c250ef28c292b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b624637bfb0d5a936a0b79cdd1241b233d3f3bcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f87a040004ec19b0c980862e36678e2408ce3f86d8255d92b6d21028aef3bb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a727e0203891d75265c81611bddaef31c13d0e0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1f7675149283b732d6a0a239fb4c03b5c40a0f67f931f17c2d75f7df8dda79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc16a49da5a7d90e3d906e78ace37aa1bfe42113 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ae20b3233a8173220f1cc385c0a8bc28387a5895c866302409fed85c598fa3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba7b1266db9f28557bea96c999d23994c5fb373 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e04b0b77a1f55ea4aae87ceb62836a301bdd73726d642feac609465699af6ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84767310d47d1d2f04eec128868fcec4923f455 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20804415b1d25fb6e4a9ab11bc0b0aed2cf074aea1349e52511e71f98ba5d81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..476a7cc204a2757eb3e166ab0109dfd080d52d15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e28ad4aa34bdabb3e1af5cb3e7b6a80c99eddec23a4280d64a0899158cc017e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d342a5d94a929547b5fe5f792c156f4dd804ed0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1beff664f9d05cab5c0e7fe64ddaea2340e988d0e2612c65df63956ab6c863fe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4c229f90945ab36e1b6bc989977075bec964f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:960c9268215e269db2f669e6f206f002e251e1242fdf87f0230e99a6e076ccac +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fe66688c8bdf1b4d0309727d318b5cfeb39f7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c625607f166767a49b1d517c0f23078821157c3903d5442e2f9bd515af9ef870 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed3ddb7eee3c72ff590ea0da5ac56f6915467b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb4db91def0dd0899aaf4b49d9bd9ea8ee24584208b104a7ef9e239c41eb8b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef38bbabae8782f6759baa9f86b83f94be530ff0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3b7bb74c7a7d49261f549126624f24d6dd2506557100472d766d8a57107a60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e67332bde21f23c4df1ed112507bc97f85ce3bd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65fed58d7a9095da7859245efaa83c0eada6a4af826f3d3076fa9b21c90c7662 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb11582fb8dc189a9dba4013d1462cfd183824c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2cee555371ba5a2da37dd50890bd46efa3fbdc12b8e0f764cbd5299d04fe59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6c00f07d08b7cbc4e6f570cac89eabd15c1bcbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81eb1fed1d8a3ccbb3ace95677b1d300436413777e96d0478572c92dbc561e86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c0aaf7e588e277eddafd7fa421c0acb6ae6b2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5569804aa1a9bd9b53202f6b432884278861b4117679685f663adc0bf08c0aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b4829b2c5a1da0c90f1d94c93b6ddede1e5a51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcab0ce3bb04292f07628ab11176863a6e18163830078e3a6c30514efcb29714 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b01dee2782d87a520ec5b51955dccbce166991f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4989f8a0d211913f22064729a7b950dcf4b82be67d360e1882f76bf2ae0326bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bce7bb26c26ec02d065db79c19196b05b1e0fa4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce71339f5928b0d927514635c4d53453414229ac63083594b495ddf7f718964 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87ae9276f65b138bb5905cc9c3838cf94782013 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b308c76aaca871e9e2fb99382c57fef2a95cb9445a4feecc254781df25faa579 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0718f95db2613f349794b1bb91e09bff2f9e19c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1cd7cb8771e10073765f7a8ce9cf7b7d0d58465ff6e36a68558396af707479 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a29ccf9f4d138f8b0fbaddedb8918689dcb7c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445e2ee1fba6fba623b0cc555c29cec0d76b405d9f00e2166565a74c1d8ea686 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b03fc2f6440f37ddf377babfd40e5727bf3056ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9218fc805da0813d0f9446f2c69a40a7e6137e3a4f94562d11db2a83e1d28fac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b57a237529ed5a7036845379fc21670121fac4cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556502e136db47e889fd7cb9d2fee5cf4e69456ebef94a2c57a6d312fd19da70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96142b95c5ac05b071145f2a2898a7be1f06a29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a38ab6b7fce75094f8f4e1748c7c9829792007953dd0904840d38bf90b1910 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b4f414e80efa1dc9aefa76a37581d843b78f32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5f23546575b897d22048021313af45d2d013995b39eb180e850071a941429e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0485ce1057d141396488d8aac1f5497fd5b815fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22fb324c0f3e5c3c189517826481b4daabc1d1e954343d99844d41f3068f650 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3e9709dad6349d9d9b97ad0ee7e72464669c78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f931e780902112d5f57f04e04ab1f9a00861dd7974d79d38169449c2f6d978 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c91274d5f618e832a04013e6b40d8e3661739f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f5c1c69b856f0604922d32a3285de1620b4adabc41942bb644df2071604107 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b095b3ad36a2a4c122b43b58896b717d585dda78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ea169721520392971b9614e3fb88d5aa7a62e6d381e1265afb96bc8a032eb3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d0ace865c958eb9c6b0053f014ebb62068b024 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49bfc512c224d697071f9e61962f6d193adbcf74d1c3918c36182189484dc648 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f7af1439d2fc26d73bfca829b8ea35f3b7345a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a29e4aaa3d64186ccd57dce10d8d30aadb99b3423f240216ead1e845af48b3d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..802fd1872f404ffe8dc5aaeae3732270f72b6b3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd658376d01cd47a766a758b0df587549c3ce98f0db2139191de3289311bdcd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db29439d55b06ae28791dc6453f1c1ebe63e371c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53bd2af83692311ff199eb5d6344dc2f3bd2bd33f29ed006aa30a9f86c8e694e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67e8109f01edfb730f62570b04e47b47031ab097 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7342a5f26dcf5fd4d75bf81b931c6b38a36b5ef174a215b048de0152eb803f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9649a0577d4aae8e49aefe40e9348934da37ac96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82393f877276e39830bd06cd5b34d090a650b4e6ad1d853dc557be044280171 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58109f57c069b0c5f27cd9a1ef523c7581ce605f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c52af72af98456297b0801ae920e4bc48ac77c06668d272c9098d6cdcc9929e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa84b82bcf13f3ef55ed841466cb03b4156d00c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f3fee5e6d3a055830c3b1b9e3478de4620a7df44d4d35fd6f5ce6f384d98fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22bd8adbd47415b90af8dc1449672c0fc11a9706 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933dbaa0383275f905505f6be6a173b84d8b2395b16b80114d976575f672856d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab6f9ac829d91bba110b5f85b6f7107c10f0af9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa832737128accf9a329835a4b3c03ebdd29f99ef53adb499324086ad2b1095b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b85cd66e9e612f90ce83660af55578da579932 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f074f03134bdd080868a8eda804c811468c1714630f32242775fc530c69c64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0de85a662efbc106c013512eb77d5fd392b76a41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7b6ee8ff58bd7b4108951a3255358b7be5f71f7b01a4b5b4ccb52094a6e12e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e91b1f08f09a4f9a2d8b9d22c65a361ce529570 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd06665a2e1d89071815269be45346f8d5c765bfc29dbfaeb4a2a94d03b33d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af5bd9178028e27f9145c23528b4dc9e0a62edd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e35f4fe7c078c0d55e7027cdb3e771cbea008ec424100148b11a5d00e1dcc3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b20f37ca475dc55761462f75fa7768c6e9f8091d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc36dcbb9cd19a7e929e702118e01e478fa88b962f04ed4a24ba37acee39742 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c513b381896ec976406b2c4bb64b36b85cf9c663 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba2df9c1aa987ab854bf5b8fa63f5cbf71ea642a734e397de6bd940d21d149 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c694ad66a639eca061d458278fe7c04631a4983 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600b3f26121cd767683f122b8f68bdf100f4dae0eacf4318143bb4c834e6fc90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a39b64d317c0504a70795345f72fd41268d9f54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff55c2c464fd79153dccb93ebc2082bee1ccca5f4a355a8a7c9a4630d6c778e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8c297c0d5f4a3899415442ac3cca9ea69264cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23036053bacd9bba14434dde197d0e5c246ffeb68ac8b93e6ed28c576a1407b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a69f28e8a49c7fc39fdb31100e70490b617e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3c7c49b107bf23c3536c68f5738103467bf41b033bf10257a884cb6594e67b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53ed95b169e284673639d4c17858a4bb086b5c57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a59eb3754e6d94987b4d3c015470be4d3ad30f907b3b70fc1e5a3278c2c3a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e6718e32f8805ad6ef33f9e8d5fe48e35198fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498da100beac139c1a0d72c2d98efdbee8fad7b4c50097079e05b9edc7f6c413 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76fc43d6e01353461bc65dcdb3814c8071fbda3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efb4427a4a3fa59df8ae70633dab084f29c9df09eb41bb513324afb2a4e9893a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..633577e7606aa5015edb8a06e6fdfd40ffebdda9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa7be94638565879d0e3254bfb99ce3f62b58d54596587a10cdb4bdbd6d3573 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d7e8843c63adf99c70a248e2992eeef1e25d48 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc09dcf170564fde49efae9104fad3d0fb5290e3a7ffcf6346baf53b1c64e27e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b8ebc9a79fe079a925cbd4c6282ddfb5ad8de5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd51f0432a67f61b1ea06ec10c6016fa69994f47ecb135eda0b5c4f510d399f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..919904a08290b6d7e48f535d693cd611826bd574 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:312204ec3ba81de6adcdb7079193be79f08fbef9337323235f20952b24550f3e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afaa357f3b47dba6633bd7bf8848d70ee1067be8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc86dba4538765f2a95e8e767778cce99a4d89f2c5ca59d2a11f2e5ac50761be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b78935bd8bfd88105e87db753aa42171ddacdf80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2525abd495f4742077b48eebf9d51fa3268b5f9b6890ec98b1f2e63d7ab1bb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..822ed8b7e546806b1e9d2c9201ec4ee2d513ef36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27cccd514f35121dbd6bdd3c25092def0ce7a7e6adb901f999a6b99cb55a27fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dea5aa3b4929d4e614c4b26da5ce3a4c9f7ac63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c632af96b999a4bca2dbb887c07cc13d5d1eaa6de20fcc24f0e1a8841c62951 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b003839bd3571ba2a616cdcad0547c7fe4e25e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9da69b13f82810863b5fb4d0788827dc9211dca914bf9aa1429d4d412a9873 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea0216f79310d721948583ad8c9a46411398ad0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634074977ba639f545ba99a67217012754b2bddcb2c5d701d4bf26da448e0cd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab49dd2b237dab72573a87826a5db5e0d1d00e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21eb8c82e3fb269b82f1a34fb4bcd8d72a0a104800be94c6042140d029ae9225 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..508c4a1582b8450021b9de01dae4d144d473fcb2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f88547c0a7104b352e5b309aecce5fa6001e5e4face572a5a1a9903b7098f2f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a3eda49c3646b4c8563fcac31969a4d9a82ff68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e731976e0424c2442a9be780ae8006410a533abc2de245f83c9be12ae0cb0cb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..321c9552dcc17627432c8b01ac73a6fac856dda9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb2ba38e0da7498686ae79edd5d581fa8a99feb221c7fe666d39719c1eea495 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc24a7f5d14c0986014eef39a1c259bf853ab68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f151510b021f52a2f18f2e90b3caea31facd0ca9fb46f3104e5681068a544ffe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0aea4299863364960b3df1ae56677e6746ed257 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:578b2daa20e881f1d8c93a2ee3ba4ceadcb67edf859b5e51337c15b029d8b67b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..964737233e31e68228e909663f76de069e979685 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621511f5e30e13cf1f299a621facc5efdf5b3e6626895bcd2d189d0f13e379d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2bac32a045b53d000a953e1d6db273d1086cf2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4514f4c5e6627bfaafaf3c3a72551d5f51ff838c18a5aebf54e4e81f6c4903f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f15fcef031ca789a8965795e3b9b9d0d8f58b0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f68050fc0ac25089a6c23bc3b708c5c72c9a78b134cf4735d8f5a1a37e3a9ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23a2507128d6a1a0224999ea88724eb068784ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc34086ebf44c86a13385251bdeba936db9db70a7276ce2266139c82ff39ee8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75a9b9feb0354e0fc30326798124ab513116684 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eeda58b32e31944cdefa2fa8a0bed498499ef0fe610c3dea0a0ca09824e278c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fea87ff53787dc51051da9cff3dc96cf2a7e44ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237b06d8a712c8eecbf91b6d85f605424826c6b9f876f0c828c3e549655247c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e3ae7e11fa39bcb697038d39defd2b58b0d382 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5d64b473fe27442b5a8eb3fe38bbc4e958b35c9edd80462ccc029c601b89fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b72d330a2ec2e14073b636808fa4fc0ea305de7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da2264e5a519864f3dbec3e9d0111a6dc411a4557a4b467b8c5c3a1280adb68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a62a42d02ea72e0651d0778ed2be821e699966c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dda48646a6ab6aabb353c2eaa893a5b4633ee02934ae23de09145cab17914d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c673b545b770dce1c9dad0c15f3c497e39d2959 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d55889f7e02d7052a9f4e1194b01c96bf22f20111b1d620689c13e56cc073e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aec1eb9b6138bd18f24c8843a3de86927d2fa92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e240fcf6550a34d20d07fb07d83553570c7474dfeae7e45cb433ce4ba04a242d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2894aab6cb2f3c2a24f2c6fcaad7bc1b411b8584 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2936cfac23e78209b48b7953f6e1a74f54487283c560e3df166365cf559e4aa4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..976ab488ad0e16998ed1cd5b5042009444c50da0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e041f25b31bcee81832c7dacf424a7559184912ecd2169fdc2e562404716178a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e4f614fd335c62452ada3338ecf0ccb9a8ff91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f9ab04c41365df41ba02aa8469876218162fd704afa6f58b8ca842fe1dc628 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79eaba8f4723a80bd2027a0d2a116a1971574299 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6755e4f1ebd241a4cbf10e058addac9ea1ed7c2d6814a3a891cec43a5015f5a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..354f65483a4f7f1a9aaba6addced9414e50b7962 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2934ce58b9841854a1dd1a50e5f6d0deab823ea816023a0b04ddd5d5d6488a3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1222ca489bcda6221d61dc13f99027734f377c93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7022f6cc9764af472ab5c32971fe9fb59e01e22046daaba6091cc00636277c12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..033baf3497d8dcdb608673b9c01afa79dd47a244 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726dca651432c7cd20db654f9d4e24bf1eee58d1f8e77d2a308ddeb98f559e8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..054435e2619b4023aeca016fbb9f855d48aba8fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ec39e9200d74dc7c265dbc34665420bdbbf6b510b83c643dd407044397c9ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64556197ba6eba2ee926b697b08cb1c61a154285 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4207fa8a127302514c265556ab0664aa60aef700e59b56cb5f71510ef57f38ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c06ab4bc6db7b811d907a8e56ed30b3b58889a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f9190fa1d2ffcca1d2b514071a4a78b23e570b63cb6c2a803e28ced1401fbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d80c45c9b922002806068dc59711a7a42446f6d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a114b231141512811f7baa229c11465b389a3874c09cb297750484f9367fe8f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca828076e473905acd4f782d6e23b89f6f870c31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afde350439c30db053bc83d046c701344867618cb2958d7e79128e62bea5f10e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16a503f806e93b9f544ee90fe9875f44fd6a6d11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423eeaaf81975342ecdc6eda0d90e62f48b38f0fbce14a2516efa811bff3e1d7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..872da767dab93c8f96361af2d05bbad6690282d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c746ba13bf992163a098783ad157fa4efba86217d87ffb6a2c1b0f4889c64b95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e522a196824991b36431eed728acfd9ce9319f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa7bcda31d47c905dab7908fdf2e741eb859962ce89fb2cbb8cec2c0ccdaf2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a303e6ca128a11f2139532be19daca8475c465 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf4853390c92426b2245017c74b5fa3604212827f7e8ea24d6a05c8da003558 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7602fafd487c3234d74becfee28cfcd7ad55bf9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789c55bce6bbdf7e404eff807cd6158995c69e6d7137543dcbd61fc7255df5af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a5f8a4fb49c07a4e64aacbfa409598d45fb1dbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb21fd7bfb6cf8d6a69dc56d393cd292675601e580a825e0d839fa6f72b4ea84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..140966ffa6c994a9798f9b6f8a9e265edf9285bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7acbc936b745308ea473a1f4f89c72010c579070fd15583f8ffbe669e81ca4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b055324b93a381ec0288b277382fa77418043dc5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73cbe96171b5951e51575d6d79f2e5c09b237b80a51413cdb50f6aac143bc0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0962653a65798a557ce1000e423732ff5cba14b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa277f097c8d43ab9938bd8078518eed855e69ec8fe94dc6319d2c9a74bfa5ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7440948df67ea9ea4d1e119e66b2daba8bc2b65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04a75075b9e57abc58f89a54ee3fc906fb14f857925eddc2ac4dcd5283678dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8fbd7381274c9f84f1d6544ad270c9447e8558b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbce606e8bf712877b9b30b0264238ed5b7d58d4eac798a6a3e582e5b18bd94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2309066b8fcb6f436de8eecba6586f09ca2b016 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b263cae3e64467d41aa007db50967ed934f8599d0cf96fc8891c4d15db24504d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8aa34f029564f997877b7d0385b20d43eb05de6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab35c0dd1da91bb7f992ed85da01779526d502e7fa0559025bcece2ced5e1594 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b956bef47f184d7922c7d94cfd17b5d90593104 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbaf4222fa0461b73fa844ec6d168848c2f6077a046ccffcea5dc478cd1e93d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a61996159261fa55fe1ef2baebc52223dadd5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce6c73b1b94e1b87a11444037b54d62b6c1494dcebe78f2780a86e4ef2494287 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eca0e46402251fa8129a12bbd3a4c33eaf3845a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1629c199ed97407e4e25706dd5a01baf0e6ec6a1556c1000a2f197beab3ce810 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e213487acb6c8681f726c4d4b49fbe9fbd29ef5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29232b7de6fec12b72dbf40340c80bfb915892d922f25da796fae2d96f89fb14 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c3e390982d2bc55c4361cdf75bc3f970fe400a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c769d93ae64ab356d6eccacd133d99e98bc213ad0df819360e944f2beae939d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3871045914bd0cdb9a4035e35b30e3ca6787a14f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1604ed68ee96c181c034809e560ffdb02156936534a02b18686d125f3588483a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e6560e05aaa6dca6a11e2ac3e05745a5804bca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68876415fc91c43f2ee035d2aee8ee6d6bf9acfc99728d76c04b7b176aa2667 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbf8b8be8cf9708332ffb6a739b344884d7d34c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33cfc8afe362d765d2ca44ed0ce424ef8541396523e707182f87fa8738c9bc41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf223c4914331a1fd8e702fabb76d860c396585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c362743963d0bef1bc3cfb3c1d92430828f58bafe58eb501e0abf6be03e281a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a4add540a008b822337a841c590a6fcd1a53d0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a94b8feee38e924fb9e82f1d16a18ee48f718b111b08044cb23f6186dab72e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a22f7338cf56d7c44c894318c205c29ac9a1814 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1e3422dcbef1e482ad4b885fd42e4cf7e59e15a970b6ca8c04a02ba2cfbee2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3054792ccdb894cc7f02519cf08aa8cb5f9892d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916e22fb3b7cd82489c5ab05058259bb673afe6d0bdd8f0ccd35ed93700720aa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba849ead15704685d9d6991fcf248426f9281647 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d9f67268ea4dcb50e497a4e49c5c1213b4e9ffceb7b5ac2e15ae0caff18592 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b3e3408819989379fc276c5d54bb897522a8882 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b3af5874464bb87153cb71d57c6010d35de2cb7df966999744d498af334963 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc95e5e39e6ce7ba20e4755862faa9d1a552c93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de81b02dddfa41afac288f6946573ddd9af0392aa4bdf1fe14ec3d62be2a04b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e776e005cb95da7cdf2efbb5fafa968accf0706 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20db79c86967a70c8100c7da6dca86a3896914256100a95feb637ab1a1f9871c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4169616a7dd50712503239639aca0048261fe9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1591bbf20fe20e104d3de6c128fc5a24b2c8781c41e9d69de25010df74d3563b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96f740c65689eeccb01610c42dbcc3d39a2d9c0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c9cd4f728a6930fa76be289b611005a1da5bfbe3edef4c6c2cece6fd9927aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f3a7e9756ff723d2f80513d2339ef79f1b225d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071baca15be819431e252eeff1b0226a083d9efbfb6171c8b22c25356de4037e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9593452088ac518a1e43648083bc061f9136d588 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaca341463b48fd29873ca379101e8a0311fbeebcd69171bd1ba5bf33ce3a22a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..563564a80b7ca13495796d4e46365318350be171 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cbc0b365440476968587ab92aab84ba74bcafb2022bbc1ce8dd32aef995d27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..610b2998ee66dd77868def38070962928e83bc1a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c06bc909d01abd512c152f4f39eaa49b615a4189d97b991d17ae14f0fdce4c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42892c491352fb268e79b8967a839ea767d9e32d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f7f20a776392c1b81595b4f1e08abca354569cc52ab2eec694773295b144f5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42cc64cda04a4510247d0da5e8ff25f99aa95b28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103a60f7f4619b828614e28d2a3a1ba67614e345c68976d7cd18f3f8f07fc672 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e32d21215c3eb95521a05fa5eb84a61c4ab47f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984ffce833515502667c3af2869b4a5aefc83530845c11cd50d37e24274cab9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6da7ec3d4c1070e7111c77de1fca3c0082a7a02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d4c272a87e3d96d06a6f711e8fd69401e73e30d9cc6b46cf351c4e63c207a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0790505632cf21ad2865ec75d90fb64069e1f73b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6279f3a20d1b483de59b0b46875822feb9c5f7a8ca59b19c4e1a94226dfc39a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac20ef0d2be8b96ce26152eaa735686f6e2d8761 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8007cfa470b3c1d34027343ec3b9aae3b03d7353ebccbaaf24daa765b932331f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7e0d26e1c112cde81cbd6f7de1dbc8ebc6f1a63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d89672e33c2d54eda4a15b89cc870e3d37ead2f89c64fb86ece2de95cf5758 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9e7c63e78ed6708edeb3ed41c6523d488fd3df5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1371ac7ede157277d2a5928cc1efd19b40f8d47f15c5c6aac8671e19aba830c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4291a1029b1bfcc198d5307e42814fb383d9906 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3165de6ab5ef7d1f70c1b2d96a811a8de5bd9b84947889b06169a1ae8dae2b99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..793fae9bb1be365bea5237a9599406068dbe5a0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5807bbf000eab1a84ed0b48492ad7788881d289f8d0d0762347d8632e049d6c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c902abf25efcac6a92bc2b73cf96e3238a043f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73eedef00b9812fe5efd6f3d8f4454b53333826a72a6bedbfc2c88d5f3c4d599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d84f89b1e2e8286cb195a908b010b718220478d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c72b85f2681b3c5489d44c45df9bfb8074adbde624c3efbcbd2d763ec356ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c412d108c07b53b89c9d4ea8addd519fbaff86d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b89f77a22a63d56feae9ea4e953b63d6f2ab60f1da9ed9976ac9ae5afd9f22 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1777a0d25ba8e616d3efd6eb17635ba4d2fc1611 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a616c2436f51e46ddcd347f3146f26845f2cb8315812637b3c9bc053bc70eb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31a1c95296af4dfb8f37c64ac6d71e3782a0d903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc3d5c3f7e9fae26a82a76c37e73a0b1a129378b29daadfb7907ce1ae01732f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6639e8a5d6ffce2ace3ea37a5e4465f69195b386 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b483c8eda419433bcf2ff78aca2881d2634eea697021049347f7dc53fa957e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..779f33e85547345362321e9eb86f60b4ac14bfbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409cf10f6210b1cca653a6bcc48b40825527c53e356d06d4b0248b71f39794bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3588229d1d55fdef2333d10479a9b6731d19c514 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881dbe8cd477aff9bfe52f49a1dc0442c8798bae13650b052c8c1098503eef24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ccc34a3dd7929f214fde7f71a53ab05cf66d993 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12607dee627b7ceb61914526fe21d4473be89f1a1c4f465d8f6363f18ad45107 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bfec86b7e5a63be1a000e58f35c9a97073a54f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c4b9562eb29c7ca74c391fd583e5e53fac7c4428a1085bf43fa29ad7739ef4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd34095a260894f7f715ebfc8f988a26ea80a51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0d555f4db65006c240ef5e28aae8e1437c2f48ecbc53870927d5d96f443741 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c83ad695132df209c27f8c1b3b8fd2138eacb64e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015001fe73db0eab1ff1ccc4a8d249380c9abfba8df0912e6834f3e4b0b52238 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..304d13c9dec0e7e8482dc83c0ff4d8c017f56d38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cba9b96c188964e75a4b7fa64d6df1a6fe70824c695c02b2a2c031c81df2ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c915978c73c87d92dd5c5e8d41f1718057364fc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ab72e46c117d5b515aac4571928705fa87b3945d4df92ab0611f266920dfa0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b02e7375f76ebac42486180024d987402e93d39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23979377ebbaf0bdadfb2ff2723a8481bdc4ab7ff10404c83e74adb3116e15b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2acf43a4f8782d06ef96784ad66f0438141b790a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5755e7fde4aa21bf006b4c9266591f7481de11d7f1711605989ff5181ae5259a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..beea00ad66a9997a4786f64acdc41065b62e7cc2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781c672e549b2114ef41c05659219df9f6ccbae957f3a76271a0a7713e6f7c78 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed8756c93ea11168e493279f69e447c4c247366 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd626f1404aeecf192b4056cf9c2f5d826de7a674dd0fe0e0a5165eff225f0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b014a83d3ee111685ce5c282d30bb34214ad765 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815f532c8fc2348a36b83922d33c8217380fd82c0ab7e97356c73f6da5a86933 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23fea773b428b344cbe4824d7826671a512efee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ab8af29cab17d3f10d6cb2ef6def232013a444c4a969e15d00d41cb0045249 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b407f61f99ccfd25e21f6551288cc0cc84cfd1fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caaf578791573b0dd872f5be70957b7314ef8afbb320f7a86f6085f78840af52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e7d089ebf21fbb10ebd3103941bbf8bd095e5a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22bcf8b8ab7b37b0ba15d0699ac5c083349c5993c85dd46fb885b894c881cd04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a108606f07c0286958354e51bc823ab1d05f99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236d5739c54f7387b5557d61e172c8b9f10169c37e4706f9ef3435c03f050cb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc0528e00e0e99fec8adb37405a6a5048ac46fc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c26ea7b682a1153329da0449f1430ef0cf3354d6fe11a1736e2d88d67baff43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4f75935de3e1d4fc0d4f69630e8151817a82be7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d46dfc66af242e401992bad77557c0513e3e6edfc06ac2d4370a0129114f7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ceadbf2788c12f5ddd757bb2a57171bfb41577c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a7f48727e9e2b618ad2937fe8163f8cda27233cc670ede4ced27d1dbe7afc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd8300e76bfa289b4880e22aa7b002c167c381c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c85c65ca8dbf55b68a6290bfe872e750f89550c9055943b4e7ce8081c7e2ff +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a53bffc1230d48f38cde0e3fe82ea07547403c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba42643ecb0eb591ea3ffcc4250d438fb5c6e05a89a6b308a5d88aad697300c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3309c8659a2fd500d7983ce1fb92d27227eaadf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4613696b8795d4db75a8b97ff7d9b588fb25d24ade98ae482f76c88200748a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..146ab552a5739df02231451ac22710827467e1e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0e0cf3040665f2e0ff7059cc840fcfd58adc1c1d72c1d9a9ea926e212feb5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffa755be5d48d62a04d9ac8742b99f6dbb971276 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c16785074c35cc4121e28ee7f1fa7dadf3561cf56abe79b060b7ce039b22a02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d394b247c547088fabcee806e485398981bc168 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92eafa89f08e79cfec0eecea73c0a3edf538b18da316481f1c2f84bf5a214f60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d48d61a8f61ab04dd0dadf4c314c1f8498e713a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296e811ae83ea4e7f9d46bc3fd8845c7367fd499b094fb813805b1118b384891 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8317f7c0469fa229ebf7c2eccf38a202ebe3aa78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6bfd0c8e7d39ab6887a3a3823fc5b1d86f7c2cc0e6a0a398e5252a7fb3044b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b290e8ca06840957424e6b1bd3afd46a6b0e38c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd50666cf5370a8e88af40a0dfe0172dc69cbfab86fb08625c0b75ceec45955 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dcb8bbeca29a749ac9c653f8e47217cddd7861e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7113f7c747f4691c2a2068c523bd7bc7649078f57b759f7b01f3cfe1b6ce1153 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff11819beab237c4ba7d496ea71d3e9dc1f6473 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff5d6cb461fabf4a5d7d6016c9f6bae120ff54a8e4d6ce4fa47a3168453a327 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d864b16eec1bce4197db9a48e091e5e525d24c80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66faee4208bfbac4598316c9a7000b3a71947a93f2613c6e7a7ce0207d462297 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2678aa245178a671f77a85ccf3a6ba3aa06e6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ffc02991b67504f8bc53aeea6c68d86d9e8b04bf365c715cfd5b1c1710395af +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6915bf70f573bbee48c575bdbd7f3302591570a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edfcb7329bae5c26a32decb57475003e44ddb3a164a56a8b4b3b2d9261302149 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c46be18be26c3e0ddddd3f131a5c9c12647962f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bd3850d6adace044f1ede3a38276a79aba7294f2299f82b507e4ab093dfcf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0842d6008269dba71abebbb2d2eb1ef792a0841 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ef8085ae014f5b63f147ba6803912f7cc968344d935925c8dae4d3978eea590 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01248c67a9c0aaf93d09db68dc87dea9ae805107 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42462b8454700025ff30af5fe682047f167b3b0cf9ab1b117865e4a42caecb80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bd048922d4e71aea8af4cc501236dff502c5d9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83466431111ff6b01fa87740b30dd7fbaa3fbd9cde16a3a81ca1a089ad08f4bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7923ba427bdb0b682ee8d944004a3a1788c49c67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d785fedab77f9b582a0a52ceb87f04feb4d420366ab4996d4b8e7e2434c43ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccd94dde4894825fb7109ea3d4fe0a6203824b43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e417b81329dbb4cc074f5befdac80dbee6f5512b7632cb3251f6f36820d5aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d2e77a007054f9fbb3bb1a582cee066c7a5646 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54ffbb785574b1867212fc8f8f549643310055fd1561a9cc1e606b1649ced14 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd4433309d6cb80042b57a9d9bd7653e199bcb3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31db7db504ba01ca235f251b1f248849ef25fd8c418e80d2f1d298d6089b8655 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7bb318ee30a04462c681c27244a71ce35b5e19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557d20592c617e72fece488dda77ec37f2d1625e205322542e670f88c51a0d79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6caa9c5677161b436fd7812e794bfab168fa40cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f83d1545715fbb865729a7fee829076c8e5b963f5c70e133fa1427b70a67e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68c692a0e76b5b4f5254cb95e3cfcd859991ce47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43904df614caeec9b798cfaf5c4730b5c70630bdc5895626b972d45d95b96ee9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7917da8be5f5b89ad2e0fea9d474b00719b9f9cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d2be3d87096cde08e7e84ebe016285bf90e54b763c571902cd5f215f02dc77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63aa71d3cbb057b687bf36893c33f89ba6985350 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c765f1b33ed666251b208e15d8322f38dd27a0814080ba4a0b5a4341f6d6a74b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b1029addd5b82a9a1b9bac57c337ac6a331ce7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d897205abd3cc0db63cb9256c8a2eba7377e0f982394991db2024b9b3ceed88f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8893de5617f3265e23177d479a9d4552c1dd26e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f01d6b7e8fde221513c8d29e155dd31c91b73b2253914d3a6c70793628a0d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dadeaacc3d21df49f3fc77174b65665750fbc8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:534cc2d4914d1b01347c3916d7d9a926d17f6cf4fc3bb41e6cdca7dc7d9e307a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90cba7466ea08b04ef6b5b1c6f83986d11425709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3e605c91ab6dd7058cbd471f37f4563083650b6fac70fbdc3ad8cfd29ad75a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34f9df5daff0099bdedd452f89edec6ff2b97e38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee4c5e5ca203ecb33799300c71d0fcc362fb9a51ce6174a8742f04660a8f1bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ac973ac5ff906485b3f6901f622dcc72128448a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88b657b4b8d5be390c029ac45ba982132ceff67ce4601840cbb797f1d84bfc33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05353e8ab3171f44a7b31742580a4661040d995a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5399b638b83d216d3eb07937611deb773e975f38e506417c681ff0015032a0bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..375d394e6ca00ef63e5fb38865e83d1c581f8b60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b2c0c51233763b6337b89096b4abf7e87da7b88c0be8839291cd39d4acb42c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7dd18870f0d4e710070d87ff1e2c1c670e3895b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de6d6839a5063c3acefb7199acfa22e043884478db2e00b57f75c1de2c245e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..376ee5a87c07332ddd28e808478f6b2d3d622285 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822ad94d018f538b7952544397fbcb1f44a626fc97c22ae82ea3f57e5cb0a5ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6931d114caa9376b452dc22f482529154c09aa6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a4e3fa86bad75bdc5085bc3920a5967e3a2af29214daecf531e53b3a81f498 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..609aec176c1f47b9d8bb2b5201d32f8ff4bd5268 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c0ede400f01c4ffd640ea7b166b4d6a46360870927de94841adc8ec44d269b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..127207f7d937db0fe44e08bcc099a1aa2b898b61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9559ca364012eda0194d24f6a78bf3049b7397db48c24dc09bdc6b97ced57667 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16616f90dbc7b8ba9e08872455e6308e07c7602b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23c188210b962b104b512ec021ee9194b05467031a33efa7e0d39893041582a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5fc307f8c354972030b0f66bf5860eada922e4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3a4baee8453a08bd9daacb23bdcef472cf63ade7ce0753b7f1c897a4a1673a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b71734b2fe1396d0f84abdcec99e70d546c0126 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5fb2b94dc9a2b158621e1949ad0c3e60bf585bce1e4b32812d2713bc9ddb661 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a47a6786742e3c0de295ff3754c90d31c5bf8e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0630f4e42e0b95739dc663fc967bde8d25fa33fc52ce5785f0dcacca72014829 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70855d897e25dfd8128acb9ac173286a48fd0b16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e79f0f8f128a99341f9c003cde537ffd8b7c329e4bf13979cf12c2022250838 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5accf2e12450d078ae4b0a10a836df878ad51f58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192ce0aff46f3e91341efeb32a4d4326a479a6f516a652ff2d549162f86ad7d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1c3e72488514881096e313f9bec0e8f964b8bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f21a2ec76a0d2117e69a754273bb3960ac2ca0acabc2de40d77bfc12031a55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc22bdc5f6e56c0b829e5b64f72416db46b54b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c522d973b896497aac88d666078bbcf1029b47ed3cc4c697d83e641abd1bf36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9527bc8762f6fba6791fe9b3f2e697753b4649a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ff3e48cfc4893a13529d070277187789ec64ac0133ff9bb08a0963bc4f268c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9e91f86aa713aa4adc788f1ddf934035e2520cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:946896c42278c1f119178e6f7cef417553ac9a367a999b8b32396be19e84ba77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53d61cd7bf382ab46b3c22520d5201b94906a24f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df68ee9540ff87eb55bf87ded4d31a5ad020dd6648cf3e3a0d1e2d135010fcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd6c890880824614705d35c6da4eb02acb3e1a2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2099ff38f8c3f714a7b0875c559290dc3ba3ef3d4bbbc27ad3f3dff2f97dea90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb531cec6269f9b0dc0835d0e2a6747bcf68f3e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486fd04c7e4e4752eb16ed2eb3e5b229bf74551e293cce0e579edb2b6e2e5db8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cbb618547d08dfbf6c88abd33972dd4099e26c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a6ef1e9cf202d3fe5994fd0f073340619c45e35bf5b69fe4a7dbe28349b0d54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11986e54a90cab5106474f37f1ca833bd5843699 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e877fcc201d28fc0bd33a51d11caa750c4b9304540bace42e46c77a139ade40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b10f3007918a7810aaae021ef45c4e80bce1e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e0ca44827ce3f0934890363fa90cc841b6cc00da1217eed26483dd7315b17c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c81ad9d021ffd67f5f0914a8f2950f48231dd27e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c66cd5208242a03f3e894c7045ce880d32421920b0a17b32a47b111dbe1146 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bbc76b2cbe6947c2ea172a8513520f0ad6f9c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcedf14d427a56f264baf8b397ddcb168cfe86dfbd8e19249abb1946b2ae73b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbb1d97e40264d39ccf1bbdba4ce7e4ab19b9a12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3716edaf75cbe9deb5f022c1383c1ca674b14c07a65ceea07ea7f88b9a9c73ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11cd46089b2f545a4799c3d84935c6631afaf9da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e789ea56882cb6ff399d4ae04413a42fb86947162dcac6d5f7e7de288ce737 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..019731fe45ed48efb9f83b6151520db77a6dced5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4637a4ca7ffc45e45ff5e87f34f0a90cb694e3e0168dbb3bcbb654a2d147c6c9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d950a4909f0c362c9b1384b0474093eb4d5bce84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737a09ad664216c125100bed05c2a10f6215d3b7e77c62d907c406f6c0955a8d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7c097dc317512bfbd5ab7e9d82c67b6195796d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd757e361f914edddf85f8c509b966652396ddbb17a5b9fc46f364f7a62320a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ba44d730c850a23096ba17ce751da1b6738970c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c79f2621ea1715b7293dec30b16087af11264258aa3004bd952aa31c6e2dec6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd24735803842062cd68dd00730f1583b0d8ef9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28153010b8e3e34df75a24ec2fe6e0abd2b0adc0718d8199eb99ab1b55cbedb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e51bcc8d950be67a204040825fa6683c6093f7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6c4009545544b9af705d94d3b61a95a801885f81967e766fa787a1bc81f281 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9d043eeb3a4ec04eefef4f03df3ddc0b9bc4217 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c78338ffe77573844c4f799a147e6accc4e1e2a957f36d81c79c62dbacdeca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..453b057412e161306beef2317ecee91523e44766 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c9eab35f61430348756ed4bbf7e7a65e645ff30a64fe8471c9cd6a39e55945 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20595981a2582c0dd3681e40c9354361f081d013 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc27ed3dd874f01e47da4816c058f72b03257e9b4b8f0f91178c1e394dd25cd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da88b06b52f42fb0a951ce29d93c9603e91cdc6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe64fec2c8ed23c926be6dd5e55737d53bff76fabf7b4194bfc89708f22804f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf0a7f0f16cb4700ffa3c01b21ec9a42fb98b4db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abefeb5f46beecb8abf96d6ea4795640b28c9ab2bcf4ab3bb009b908e012d175 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbcab8e96c80a78bd0caf058bcf778fde819250d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2973fb3a5f17d58c6bb4a30c9d7b1c1b058819123e1e460c9a36b23a19ed5efa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ba0aa8c5c5abb33f40b820e1dab48501652bb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc6af1f84f4e6b2ca9e0289d7e686cb5e0ec52a208a346caac51e5c2e651e3b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4235967c01db7c1392ec39e5761ef547c454c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57c6a23fbf94b64e68736b0c36ac65d41f5c693b874735ff7f4ab615c5200c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..777715cd6f04be486db7efecf5ca9bc4d44cf4ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501eb0898321d755fa4434f0a199968fd9b20135bbefcf64caac8d3bac20c604 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3abb68ea0c2cf107c355e52b73239da8367a9a5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07909b1faf583ba3ba86b54878024a646b52429987a60b55cff47593e4a60077 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52da60b1e251c75bd60527722e93ec679f5aac56 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2cc9ec4a871421dedbe67e1b8236463c2aa779571646015dd2184c21ef491b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c09ec356aa00e8b4bb3c7c4c80c1725495cc50e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88bbc52ea3318b622cc6ec1898b4688c33fbd9a09279ac2f749673ae0b228588 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c79efa98df8fd181d01334e0d05af65f7b3d27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f604b186f13d47cb1877c12a37f9c5f9ceb5f3d73aa7aa40d97cc906fdbd50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2ed9c142c95a5392b3ba468f7dcdb4c0eb186f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615f063ecdcca74f44c769872b07c895a3ec0b69cd2e776de09d161d5b650bed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d96fc21cfc8af4c565482e426da6ae4df60f80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc2c62ee69b52cc7e4a3709623d0591fe4f3e53a036177161e18c43525e9229 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be898454efe4a04c3b04ca94a56096fa9fcd796 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b8985d95012c7fff4a56ddf57bb57ec5229e67782b8cf68dbf30184993fb56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff76742fd3ee83dab7ffb751ebb99ab66568048a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2df30d7ef07c12aea2cc1c12bde0e922e6b5273023332547bda837a2a6a0e7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ac440068f20ec3ca3457c5ab799330ceb2b5325 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_16/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852da0094e03de0d62db9daa48cbc6fbae7788abad8eaede9fb527dc54a29506 +size 11395