diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0635d49911ec2362268c6b9cb07adb5ecf360e67 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f7dda4da518c9b487610dc567c15c099d13a1da79dc86ce4839e1fcfeea48e +size 205955 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efa56816c34e4cb803acdf666f28e90bafae9edd --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d48a21677241a115836fe8b13b047a4d916af01f30ee643b5fdd7fab0492f833 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86c539dc6a5e00101950944857d61547b5ad6605 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c6b52e1973610d4ed0900b53b13c2a9984cbc0ee1c312ef6313809cb2e145bb +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da27834066a8fefbba29d976117145c9c1d0fb62 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fcc530ae43d606c52f3ba6e3cd69a17e3388e3a555000c6af58bcf0e83dbf28 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73df95982551ead7126516de979ce27b13934f91 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dcc72b12290201fea6a5dc938e0313d104fa3a6f1148cfe8a58825aed94b6a9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb484e30576604404bf886bdae44cd92e6ce4403 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577b6a436bde80ea5cebba66284e6c12f6c027d3b507bdcc5f6b28b56ebd7932 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd04d7ef72201ddcd440765834ec075592b15a6a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4d912ff4ddf78085485bfd097eb8dbd94224be5578e1d8f231068c7204e125 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09edfbca3cb2b3cfecf36f2bbb3afcdeb1140497 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5507da3c50449f154542caa987c5c5fb1c31c5a6591b16c025224e5141935e3a +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..580a7b052731cff25a0893008ead2b12d19db6b2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74f52e96d7fd77d1c938bc1267740c28bd53eee50251809539ad00b2f91f5cb +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..390d1fe0dc685f5a319ed779a5f22a62d1b23121 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c058238bc62e924259797ed1a5d7fec26fc16c0ada4638e7d3cb1f7d29bf7f0b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13bede1c862030f522c867608678451c55570806 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5e2665989350573a4027940e96d143e44c983123a3ddef5ab8f7a7304461f4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c38acad7af418dace20655c32fb8eb82691dbe6c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b7c6893a2fdca4de20282d28517fb77a66fd4d5d1d862a09ca4185a60a33a7 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6ef4168a52d7b7d02efc5b67e55b7d99d5368e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5259e46aaa3b420374efcbbcb9084831bc1d299b9bbd778fb1018760f3724ee6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0311ca4a23215ee17244e39be3538ddaed9f76 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f87e234c34c7188e5e81ca5e985ba39b50361ce080dbd415e2d078ec987468 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3976b8adb079e968cdd7687bef57d9da7a1f6b1c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197ee31d2f05c168b1f5f7f2d271d0e7c0d7797254b9a5d517efeb549d355345 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5b89bc3a9b096ec67dc784590bb51563734883a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0684752c787af6fd382f081f65e3e46e34cb0fbd3d049d348f7ddaac7627848b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc361f1db6cc803800e59cf5fb17564f059b1be --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4a9dbfbef345d6e6e0619a7d1c3491ce6bf28c83e0ca256e54891a868980c0 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1450c5f04f4ac7b3b3bb704b9cd85a1bc7b234ca --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619169b3aa4b8fd9b4beffb2a6836eb0cf644b4d283289bc560c5d3d257d4453 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..577be73df99b987e0ac7efdf394908ffaa01b091 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1deb938a56f8158878edcb45d62d3502fb9928c64888d3fa0bfb6a6424a414e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..573a3d29f3530212373652e69625e89e1674cc3f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91722d88ba86b3c167ba3a3fd939f2fd3f9df109ee532635b8fe77c04701b82 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d226bed85da38e3a9ce94d0f5a660b5d1ca5c052 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3b0042336e348861841a38a72070acf071d3cea2577de0f7fff4c52652c457 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca929793ed45c24714d131e812a9d5f489ae89f0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781e4cc7499b11c225e4ffa192e70eee25a29fc3abfa064dfd62779726584024 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeb8c5bcd33acf129ab011a06278b3757350f830 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d99e21050cf50201fcf62040c973ba3dcd848659465c9c1d6164cd8b8f86c5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d8a6f7003febb4df89efb6adf7ff9cdafa4edf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e37ed8bd8d006f3216a2bdbc9eece28942cb9c6ecbba32abbb2d62e551fbbc2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6faf5bb90b7489d6a26313a536133cf2aafec1d9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0362cae6ca6c29eaaa5a1900827ef7206ed70edf8d9d9a300db6dccd44c138e8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6302090dbf7b709d8af0ca0d4b6f70ebf06c53e0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d83354214a494734bd3e6f039e322b5241492deddc3ab1309cd894807749667 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e919d552957f56b53c824d4465e98539c46df8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24c722867630a213b2b32c4aba96c2aae01da0e3a9f9c11eb9c255e3ac66fd9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..078d8de9d83c447fe7c06a34854b5947d3eb6c0f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6305cf89052bff2485fdd8ddff70ccad39202648314fe3898424de62d2de9c19 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90a90c8d26fa94ca7dc2c3a93b8b1fb884b5687a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5d8d833f74ebc3d07acfc504d07bb2cb0fbac0fab30cc9e5168c192bb6c093 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e643989d1d694d1f3e48e5aec850e63fc482ba7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf21b36d485857ec70001f19aba0278ac81b52c0b56364e324eae073e02b347a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8660d6e59c0685ba55d696ea920ad838ac9b9ee --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a288665bf61e2ac6e7d18d949a9064c3e14e1721d710e82bcf675891ab17926c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b67d5e1b829d136f7e66c7a7abb0393433a7cb00 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce2d69712c44f2552f7c028c480bf323972db784093d95befbb12f253854e74 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9977588d7671ff9e4898367aa444522094f35c9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f3d1b67a526e4f7c4e2f6952cfd61c70b0dc6f801aac0733c4fb78791fd8ac +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b33bbc5279a13bf7ee5e57aa08132ae3ef97efa1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09db1408bbaee1938bede1fe7308ffbbc1d53824ea32b3e68cc9cc5ae24cf3b2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..600b4aaa467c7b8cee457ef1a35eb8c378860e79 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d85ae18cbfd7d7aedfd641ffc8666d703b4d482e595955f980f89363f51f28 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99889d33513a68ff31282538a08f74ec65336981 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a01d0ef3dc0b8f0942244ebed0a9e8b0ee2978a2c3ab3783ddcfd3c708bcee59 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40a096207a6be48eb835a9cfd4ee5308c01c5e3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a332306311c03470ca7e060c7a389fc6080fca6cc714d131cf17a818fb36e33a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c1a8424263f2fc2dbe85ee1baa400064c675a91 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ba3ee988b022c336e8e425bbf0944432fcf70113ed889a61b56102a1aad834 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d14879c9f1f263402ca1ef8c153f04d229f37cf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b6d11e361b815408da7cc45bdd3a6f51732d0dc2aea90bbb29028d77548a66 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f978ade70d29cef174fab79ab6bfda70abc56b9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a970d54f87eedfaf76660ee627ea34138bd0b7504aeb3e4af48289e4da7f01 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29402ef469e1be30ecf4b7fd6f16db9a6242cfc5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11acb470c4127b322fa8880f416f5448b41a1cf14d98293a5cb4fb76a6b8172e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2432a45d487c3096804ce8ac2dc3235fad3b0bf4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161c8371810822a4d6d403f38e1e75a30e682b708f6602824b5fc0d480c6bf32 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41d652995d1d43f3f0fcc4c156791bfb63bf21d0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646220168f5c140433de689b5a5e52b3d5971ba245b594bf86f7caaf80f0b045 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9574e55b8e0c3314fb399e86d92aecff517ced --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9faacd054e5be373f9d41e9ea7ad3f6298a288456d9de1fa122eb311d8050fb2 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a88a4d3124fbfa12a8d5285664a4b0ccdcdd3750 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927911fdb8912785f165ef4a3abd7d72a55d3cc2ff0f3f4a65bd573b0c549019 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a7cd6b7f649d612c7f4fefe4e44c8f7ac5ed3e1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d39d3762b49f3c6e00b294fd7401e268db62657ae535c13bf7343c6d331ce3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1ce0bbcd9c61eb0e512f2597bf3e9ab7c272081 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb555392dca44193cdc6a22f91d8228f7bd6fcdc715b61ba294f307b499e8e5d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96d001871f2f9cb97f51213990cecd67be43f052 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0c0154f8a524b1d2c46c3b4912b0558e2cb5c7c610b520f45419a893d9b98a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b1d8512f4f8309b04c66e461beecd2ab85ac86f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318be03855a526881539570f6e172cce61788a4ca03efdfab54197281e682060 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f2ec5446bc9aac3aa90f3957bf855c3ef2852e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e38151899636a630a9bae9c98eaea4cdfa32fd1774529051579ac2f26f59f6a +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6db7f6362cc373ac950c74ab6ce886b132013c91 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42adeae8e6a863dcaff9304df73932eaf926a28e4e44e10f34192038fbe9acaa +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad6dfa5b364977ecf6b4ee2df592a5b79142a4c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120a227a9b9d16ce7f2e73ccd16f6f9f4fcecf49239dbab59c30b6dfeaf0e0da +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66c825f1173dbc8a9fe25796e464351c6212898d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507dd36ad6a5389b9709ebdd229c24fc7e18ab10f6ca6192fd0affca44fd1edf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a58af13a9189f06a172985f2d1240a7ded9f1c0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a165e3cb63e3380178fbd793f1cdd20168f9be596e79eceffb34002fb660661 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c19abff6fc7fbbae9abce64fcc6ecb8791d70c7a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3b224ad0fb530e22ac7c2f3f6b166705d8c3c176cfb3a9ef38f99e2703b708 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1db9c64b2b382d29f435b84e7a434a38d5e447 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa6a61daba77d0191c0176f0453d1cde46468badf339cff1d77c16d46c20990 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c94335a2640bf8c8f709d9980705ee8cc6787d3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c513dee0a4f82aa9fa242e11afbea0707be19ab128bf880d757b716ac5f913d0 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca429baba0db8ae66fda2fad8852fee6999b7b7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6055433b265e179a9fe63dc571fc80484fe770bc8dc58e27e836e68291d17486 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ee10b8c8efed955ba19abd2c67b79e3fcabd2e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ce8c60ccf36ee6e773d5461a19c5abbc2ee1af0094e67aaadf8610498707eef +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98d85cd323b71a121ce5c0b073cbb88245e5b9ed --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d769f443e48d935dfc07cbddf8253cd5d9882454fc469cfde2488bd2cb8ecc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02a23b9e3a407458f1cf0a31a15aee2bea982e45 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ada01ce6c4b3e84375852b94b032cd41362f046c9ca2561104270330021eeb3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0857078584f0912d5e38320386fd8d8a4f4588a2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee0ae82f97fb9464c7897e4e770cc2fdcb20c4fbd1048c45d45a3bb78015669 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2c77b14557b511b19611516911a843a7dc1d8a2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ff585153a1e7fe696572e2d0ae3b3246f67fc029415c7cd2fa4119f4c75cb5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..261d75ad36793d32a8db0edaed6d25015fb86fcb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17845b1e87df6bd6bb57837b45d1e6166e30126660bf5f425f83243d7f3cf1e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31be37970a635a4be9b6848d66b015cff092950a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182f05c5b0d65519e2bf34fe99569ad56cdb7c56054bf113a5bd96ce4ebb6bb2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c01ace2028b4a43cc3f217ae20eecbb0dc7bd4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03c5620c61a1556b4cd7ec9112adc3e4cc9ea830494355fe367af530f479a2f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b24afa4abee593ab52b9148cad80ef257a1ed1d4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9c70efe0ce087e132728c2a75585050ae8ec71d3f95b33eedeb7692026b657 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5861b53a83384c84453ffbf5bffd7170c0e6ade3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64e5b3f1c8dacfa7a1f3e67b4a510dd458292fae56a035ad3ebd326ae88b635 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c6e531117733ecae2dcf0cb6ff535893cd7e8ee --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be85e87834b47ec452051059c326fd78af7ac7db027ec3457e7318052843fac6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d87d50951dbc23a3728373e6e6a465c81a0f3109 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455a925cabb14351b24cf44fbe24e96d730a24ffa47530bdd606ec8974ebc88b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d284e597d61405ad009699fcc58d1bc3f27f667a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa5259234b410b5d8472a51bba8ded01816e58acef13d8ca6370498fa7b2b5d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90a136d926b153214bdd0d7fceffc4f852eeb406 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9a2195d72685b1974ae629cca1fe0c320e3bcdd0f17c6f187d3779a12d0380 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8e71747879eacea037e5ec7c9abaca1fe45a72 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8d4af28138df81063e376a13e83530fa0c28118f4d2819973514ff57750433f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9cdfc592ca6827ff13b62e6551bb5d4735cbb9b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6c16df3c716f917ca70c7fc7c1124274a36adf0d2032e68339720a604f54ac +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07c695d394bd546e7c94b1879d6016e7312bb96 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c8c916ffce8d2b6cb7ae088558d36347eee3c6e67c2ec20200310defd5101b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a024b758ba9c378166f3fa207d13d4af8fd8a863 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f3f15f46052e3d912a3d8721b29709bc4f439988a02d94e06360f566668cdf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a18c69125b7bd2650dd6a721a07214a8a1bc298 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f14ebb12fe99307fc0ae694de29298b701f72d103bfc83bfd818e74bf041b78 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..332931ba4c93a703a770f982688e9bfe605cb0f6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f2091feb44eb1257a343f1664071dd4b21fe652b077ed917cbf7ccf158cca2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8195c2ebb372f8497b0c445599f18feac187b6a8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:988de7219039422a99cb749331c6a506c1c86e2ef4eddd829d244cf93a202f50 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..913c4295e9f6d399a9cfca5f17c6d2cdd449a24c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed78dbf6f3f38b82e919ffd0a093a0942178f9e5a282f6658d97e5ee4002f4a +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401c2a0f43c78ada7dd0c2b5e8b6fb266d75150e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d6b1c19cd7f4355ab277935e585364be6856b56dfb401cb0c2868d26952a35 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d95ca3e7efae871e5d3cf2ecd0d54a591ff84ba --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d28c1edc0d3022745dc6ebe92851966eee2bbc65a85de12c8112ed14ff3818 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d8b121d34a2804be1a12bfe38de1abe4926c3ff --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419e888c7fef50a56a8eb3326b170406eed6f4bbf63925dff8352c11825d0519 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1740cfc63905624fd6c539b1a51615590ad926aa --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739f3703d748703eaebd4df0629de3d33643159c42c2b493ee540f9d4c278520 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03934cf0c2375baf5587ce1d3a16dc86ee8cf90f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565d231a059e4862241e90bc01627789cf7b8dadf6c1e7722f580426e62aabe9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9104c9b3af60f2317ad9a22354fd66d36ecce91f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745f960a29e89b0213aedab53e203295479fedb657e3514dd3388c19fe8a5cad +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27522dea9d597cecc24300979d4c1395ed0645b5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2adf9bd26cfba9cb04853f6e7d5dba57a339f85733ca172f851ac7462618446 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60daf311a94a51ccda8f87fb46a07c6194d5a43e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecafa14aef6b8fa7fc35418179be94a93b62529039cb3e323fb4a4e0f66b7ca9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae05f11b2a03cb428bdd261d4d058a3fca9deebe --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545b3dc3a558cfde081fe33e63274298fd2a929f72866d41200bf15043561663 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a39b2588a178bea0dbff4da832bad618aa150101 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30983c8097ccadf77ccba9a282edb3120e0f96e11e1327fcfaad814062b5813d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6bcf1adf6752bed8b28b7bf036baafa7911c9c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d963dfb31fe4fdb12253d5633efd08adbac96e859ac8d08daad4e509e15d3e6c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4a53f08386bb7465611bcc827764e165d5343f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c933bb8daecd6b01b7f1a5d21b2c3d72a393cfb2d93a9aec1ec499c3ed45443a +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9070a811d2e8473fff5f9fb07cb76dafff46084d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06573d84cd3178a112e237024e888fa1a8f4923bb9779f3d0b0b77e056f6e15c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ae0e46a4c3c43adeb92e2682ec4f6745cb40f7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1460978433271333bc88439415bf5b123f621fe705b9e55911fe77fd9c55cd31 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d4466c62d8d95e7161e8d3743282916cc5aa7ec --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb45a99f65b1a255d330764bd994923295b2cc2a0f86d47845571b6e01e8cf8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..582be482128f52da11c7fc3efbe1a283f901ba70 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f966d5b0555c5b6cf67d6176b06bd68431b7d6da24539b57db6509f2317482ce +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd4fbb72cce44db8809df30b6bad451d343e3fe --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66292944224919acb3e3151ce03c63636998be34252f623909bc467101826ecd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b2b172a43d68b204f4c24be9ea00f8a14f09b6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8ef661d7b93d8cc2b5ca1770fb4e08e582cde356e6cd99850b8849c4ee4791 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80b89ac8751d89172578a83248946ca5680c1604 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861d53d3a1855d4607b3ede39a614e7d63e80dd70cc474c59d1d44fd5dd5c6ec +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cef49f31d2dd6b11e9b6d60e1debd88a6de1ea1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4003e6df15ef84771f79d79be8ee283a23d9c56d24923bf85044c814e9750d73 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6b0e85b8127018e88e26617ea5443b6b96e8bc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec35b71f07a710f787ebcc5763115e7728d74565a6723c52b829ec29c5c48583 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0316a9def837ce06248b988f6f989f95b94ae545 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc14f4f5c420b0af6285d5b10c16612cc20b740243a823dbcedae2e69420c39 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1945a7022808818e4bd9cfa07010c94da506fbf6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd2c7f148fbb28af4b2f0a7d88c60d82d2d2c6c88808e49e43970b4069035cf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abc52213ef064c66ea70df129038d23f934179ee --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a9a2236c8ffac07592495b1babb31d4be1addd081f2cac245780002fe9f7d8 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff136faed091544cfb3c749281c0f62772f8d80d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1260d0bf1fafb2499a2f419bf6594b5fb63f82d8e5060629262b86776a2dfc3b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d1fb72777115943b16273d5fd63c717b77f0439 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d9bcb75fc46d7ed2b78d0a452b22c93a2a20788faebb591e7bd61b2d6e7902 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f9bcc6d63d1479c99c294a954e719e0b960131c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d7345245c75118e266fd04f971c5cd776d36cfcf320eab33c68e7c4a4de8407 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e949d142160dd909ea2106d80d743b2733125570 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ab712003c755eee99eeff6410d91768e56f28b31496735d46cccecdcecc049 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f907870595a4da687b89f6d851c22beb1795a29 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5d4c755fa67aa92c578d31a3be20e4cc7fbc26ccafb05143badcc0d26f4ea2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..320af291c2c722d0dd7a87d40b84591af5e8775d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb07e9ba1009f81b1e355f76bf614867565d596c6f72da888c1fc70fa08915fa +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c983bf9487346fac32a5a6209bfed2a69bde474 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80c78b97fdf67612d7bb97a6dae18de2f6a29d59757f52d0f0c694d0a8d7d48 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..964fe5181cea55900816cebf298abcafddddd6a1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e36378ea50aecfc8656432d98ce2f945b576b0bc44a841709fbe00c831beb3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf841cebbadcf29a86b59a710038a920c09657b9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a90bc0357d85dd6a8dd1ade66146fc5c050bc631abdc852e38091e031906de4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b63c22c86a9b9721bd342f196bff30dd60398939 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c935967085bdd1425dc6d66a2b5648ad26087698a7ef6fdf9dedec4e62e9f1 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55414c7ea02cb17c1babd92d215a7efa36436af9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e664baf928b9bf7e07e58abdb921127f4a4f27a1e0b19d341be9e6b7976a96ea +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..482c97e38b5ef3dd76cde84f2ea490f1472ef04c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3231d277f8a4cc6a1f37052df670b1c98c7d2d62b4b7af6ec81a47a6950d0b99 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55bb33aa25b14f8fa638d91b16f1896608ccc637 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae68c34da76dc814b9163f6e92731e6a4f433bc69cc57311cfef8bd0df5742b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1819e2521e9aa0373809bae872016ba1ef8890e0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0329dc62cb46383bfc15bb5f3199f375df302b2b10520745f92df9826af4e899 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e463fe9e58a110b190fcabbfeb626dc0bab1f535 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4303c118036ee21d3216b1bad5b7ccb3d337a7ade09bdcfea650cd5248c6c57 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..597ad88944d9448656e45b081d8994a05d7c87c5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d74abd03a9a13b23cdca8e552313b0b63962f033cff240184b77ec72ee484c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5e2521d8680992476484159f9108f7b414f2cd --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28962ead6322896c30934dd072fa49d67d1abc61202530b170047618203af652 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5de093c73b32132bd3bdc5b75185b752c8337a90 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a0eacef4a731ed5e27c9112a923a660a5f46b4a667423a7df4b7cbc06ef97c +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a858bc7483e601ac84ad98f6bbf06a3c1df7a98 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f73591f5e683a967cb74e8469088e468a66f8abae99d9c526007ce6429ff98a3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95fee0bf048ef4d1904df294051ec141814c1777 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278e54c01c38335630ad4da66e964181b067cd84f852dcc9f5b92040a65609cf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d49330080a8e73dd5cad57aae5897e55e6697f9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34901539b900e7cdecd4b39e9142217124f5908e0f13f6e13af41210a6f10aea +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b983fcaa9e0209cd4394572774519bb24c8bf16 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3842246d09ca5a6a6ea69ae15187c3beab8b44d64d55c040fbad6a7b83e5d25f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e0ac376e37cf45e824031246b5ceccd6a51f186 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b066f01b901dce2c1de1235a742c0524dc2a87dd983ab50a829f99c1c96517 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58076850e6165ce5f2fb1f196a64778e54a70ced --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586e1ff64fe0c69771a6ea5915012d8ab6d5b5cd1d3cf0c83ff79039f6c90f82 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aed38fd6fc0cdce393637dffe3d28916925032c4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10cde8e3b2d06f8ec07a96062e1abbfc0eed630b83d19760e7ea32abeee14e4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ba88b12d46e1993ca936b69aaafe7f0498776c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2d813f35fddd7c1c5f58a985ece3550bd82707a81635cf3070bacb1e3665ad +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2c6f0414a584b3c425e6b81597be5ba14cd9f1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ceacd1c150bceb047dd8395553b8121771775fed849cddc37feeb61c3cf166 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea56c4ba822dc243ba20072fbd8bafb9c5ae443 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d11a4f4fff00860e149f8faa3fa26f6a5ef22d3a047ee45a42351c67338fe8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c951203959a9f16371216674542f7120de6689 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf25756288338a24d01b1ed7c09a4af4e27fabc3ec70823a939ea3880af9c4d2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9840f53e69bad613c7755b7270d0597e4631e5e2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c90b4e6d703850612a58072a63304fa56d5c1e60578f1870f277a5820f904da +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b23131fc616db16afacbc414d7543dff5972aa --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43adb74e47ad2c32787d9a8042727806c63ae18113323b989d4e71f49d483c5a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..488f7125405ff707ad1b1e64056d0af2f478a143 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad00b2f7021c7d19f865d63d550f77a93b2b5ff9639b69e1350fb1ecbc810e81 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4137758c50d7997b7951ee2386d3fcb3b1cb35a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b56d2bbd97e2a64404ef479b02faabaad3574b9727f6aa0d2c5863de5acaa7a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..601e83caa94da53f3b3c68e878f3bf2707eeafe1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ffa32f64b9ce7aa95c34fe055cefab85c17231f3d69dc373aa6b49d12c6be3f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..383b5ae758ec4a6139d9f8c2d676123ba337519e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce8f594df105fb00b4a78559a363ec9d0414d38b87d7aa60436106a0fb50cde +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b7ebcbe96600319c1f43a379c1f52262934f0f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479037f61802f5d09c99277d45880ccb1307247bf6ffa946ac9891baf79576eb +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a74879baec55ae20842da082ec0ba51dd2e4386c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baed88df718cc82102307ceca8755be8e9163e82427fc3ada7e2ca01647e61d4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db1ba0f4e23c3afa36c23d24d9d481c5f7678ce4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138f1bb32d7e596a6297bd0ebaa5ff6b913761eaa3bab9b90e6af6171f942c14 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2f206e3c37cc086cf490cacc0c01a014988a4b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd52ee7dd84c3fc161d5f6c9d8e8c1154d30e8d3ccd836db5f080e7bc3a67f32 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..867ed1ca05d411219950c789c75778a2c882fd05 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df38ab2a60c9c5a7480a0e90640166bd6a6a4a2f6f5531881001824668943450 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbed26fc481e69e2c8d5168f85a5a1e8952137b9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddcb26f098746371a99af910dee3d93cbf6fbc89746692e84fefcdd4fb39db6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9639934c21ffaba234a2d633eb86b913ca935775 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1594b9d7a99fd5e5fd43bc6065822235948bff0cda3acd26c1bd4d1cf8f0f1c1 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f70bb23aee592b41ea5e8f726d05c8167e954588 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e738c0ce2726473ab033f68e1c6edef171622c24232317d0e9bc323182dc65 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4727fc503340f6c29bcb2847a37125653fa16e2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b0f31a267fa6d9c1e1d8e90401006952aa41502fd89eca54057803017e18b5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d93a2fed99adf24c01da162e33a5f67c88ed0891 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9067bd4046f58eb7651a80e3d0a9379a17f6ea124763d961e7b03ad75ebec19d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85547cae6105c3ade37c9ee4310585c8e50bca0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0331c0a2699706821bea44db9f4fd71dc017551f6b0ae1ef121f3ed30a6efe0e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12b18ed622790d5fdce6f03e529a36d4a1490bdb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a768c8b1af9d704fab753e0203bb9ce84e4c3682bd810333c7049b546ec6ff +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17191905db9a324e8ec7bbae9730f3028689b5b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee7fffc7d62a7b56536bf08a8ba964249e86818df0b87ebba94e4d0455131b4 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e23c26ba0098948ac7d217c6cde388c8280280 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d61d34b8083c14bbe780300c0e135654d0fd655edff86e1b7c5164fb33f934 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75229ea7ed99ac1bc577151f999b9e96b368d30 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a2cb44853aa07033d411200327c9a6a6b1c2c037bb4f703388b69938f46def +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b1aacd28cb511993bbaa30484c11c0e26c2fd8d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7435f50898d359662e39a287db352016739dadc59e93d1e9030f43f84ed1715c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3e4a3a8fdfecf7f6633fc0a8199437e912c6b2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370aa384165d2c76db6138b49ef4d066eacad864825420f008f1b14651b5330a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbae8fcee1df45ba2894c6c2c005929b1222e75 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d907d2db5bf008e1445cd2ad0906bb4fee90bc6748bbf1ddaa0bb80639e4a7 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f02114f84b89033f7d49eabbe4bcc86576f587ec --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e2d4427b60609960d8734a1e5ad7507dcaa806f9c3457121a1568b259a61da +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b62e9dbbfe6bb6611967231b4ffb8f9deb7fba6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f7bfddff37acc42ca8e33f528f0c96dfe7f2962817ff7bba46c721526efda2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..740fb2b81e64243d0b76d9f730cc136880eb1ced --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad01d86c66925099591518e660a5ecd8cbee982f6bdcb7798c4113d8f3624fd3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..daeefaed635ae5ea8d6ecd9a03f64fae7af35004 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13d0315b92d42d2d6e0f47b02495c597e57c4e7171d86cbe6e14f64c9bffdc5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60087b85916f2e9e03bc05394707daeaf3c903bc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5be78633659a3743f7035dd65ba37ad6d718fd7ad2353951087575c30a62aca +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..190dadbc4c06b88a01493871a56810fd3cb72c09 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9016198967496687a43a9543fe596fb80adb266d22d5c30c041765d27c799e80 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0083770ea1e1e539f3c4209e471de82e90839ef --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdddcffb82d20b4c09bda13286108bd69f97c3fe739e5cb6209aa0d75708f743 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6746c2432fc817b11b0e0880b36dc40d3f736b41 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5e9e573ea8fa8e559e25ce2e13e52e77af9c2cfe9a52cbb6549e7b0ed80645 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..006d936439030c50f65c12ec697d529abdae9a93 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c41013aa8f9f0df370f337eb22f7325aa4dcff4476994ddcbcbaf01be6cd2c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47eea13207bf6d4cb6514c4b92d658ab9dbc9c22 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3bf33cf2ae357cd7b471320fb3aab3c2de4c8ad6b3c3c412d8df77f7487b26 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60779f0e88c60e5116b259fca94b5b9ffb828210 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394591ae0a0274de91157c9d78585d0aa4af906a2ef9b541d9a2bc0e9b26d86b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..340e3654fd9efacea7d8a19bdf3902c2e75dcbf3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2268ee4a7189961da4e8eb159becc65d9be443358dbd726fa7692d9d571f363 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a556e54232692c7b4d64770ac354448e22a0918 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e84b851a1b8ed8218b2e58da417d905c9be83787c84b69f13f476c913d8690 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..808eb3b18fa2c720e21c00155211f11a64e98918 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372d7ac07ab89c80ac9d8bef9d4f7d76450d1763a69d15a768da71906bdd89fc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1a365a4f695a09205309a5db0629c2cca403abf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65735048906c2e076b2834a4dcb7327bc077823eec2d5507ba628bc5b798ea21 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cca01d360315aa7259b5b87d00c993114c9e7a9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:837770d3e2626fe11e048b98d07a862ef873d2cfb4044200f48c4ed9a2f13ddd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35aaf1a753f4be4c09376180c5312527bf63877e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4d93e4b59e86357532a0ae49c9402f79b0551ddf75eb15e1eb872249a05ede +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4d4126cfc2317c3a1dfbaf693a866470e2db9d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf8711302cedbd9da7bda4a76d817ec0b1798a8ffb0e1f8282f2d3ecfc002463 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45eff5b9dbdd0bf034c1bb88eec9dcfb5ec537b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d745f03b6fc203b8888dbe7a910c1e198254cc0ef37994ff2dbd1d3dc06b69 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a196ce253c0e78479de713ee1f5c32be91602d1a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cb9353e834e1caf769e15151ca1594025ff1abdaa3d920809dcdbcfe8b3b1c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9fb13cd82c3abf5f9d759bb5c5e0d0a0a7b262a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e61568b9b8ded44e7ada8a52b6bb0c826f775b37c692fb02a8f0b2fdf6220a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55e5ec72042e42fe2e2127d6cc5984c383e24bb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40aef839da27dd65e8053e70d73392b10fb57c64607bf56599c45c4448e8d2a2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf71ba0081ce320b8f0c6ce088266f38aa28dbdc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b15ae520b41e4b284f3a209a853012977f77b54537f79892b018df7e996e8fc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e8cc150d232ecaaf45a4abfd6ae8c4fdfd198a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad0e68985cea1e6273a36a0cc370a8f756d1984c5cbb76f8e29ad5d3e7f3c3c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe683433fd3b1ad23a6f409e3c6794e13ffa078 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f0ece160ef1f6a7664714aa00532a2ee7fcdad77b7101b88a61a07dc1cebef7 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46036fe6f16f32aabd29194648c4d559bfcd888c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346cc7535a4d1e472770e958d77531fcc7af88753bdc6326812edf192cb25be5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e858c84dfca24552fafbf56b632bc22db21e8df --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62791dcdd583f2f39ee23a30d482ceee601c3901caf37211b7319d1d00b1da9f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b53748d9805ca6f2e5253704b6a3f3b72205709 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37fc8eb38ed3580cf193ba24d5e56db17120295f933628291c0df04127b4c917 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e58f23eab961ba854ef2da958049435869033261 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d20e9e1e94880e871cc9b7164c89ff985750d35336e76a06cf2d61a8529ec3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74af1845a7c8041fdca2f69270c54ffa3b8a0c97 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d4b4129959624e1bc28c2f8fe70dff150d8b1c0b12c485c5d5315034f1258e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b11e0d85039fba2765b5217cf652936aaead96d7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba52677b0e28d31707cfc26570f9d86bb78942d9f84fea4016699d8cc47c6e3 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ba8335ed16bbb5062fe726289a6c29cce74a6fc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d4e68545abcac4c630f02bae32529aa94dbfd4a3594247df0a94dbc0d7dfc4b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74c675293fcbca0cb9923227b0c405a0bd0f71b7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2762c5ceab2202da2c25ad4317ba811a9079a6a50dd49459abfad6d4ffbce3df +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00912e8e654ef6506bfa25bbf2d5996fcb9f3f1e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a56b044a3f5b511c0f4157a49730f167cf5636f814366882946f85e59981f6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..652f24b94ecbd0da06536a464fc181cf512cc600 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:480b1c9212c8903a325ec27554138030c81989a51237150cb0eeab7dc384145f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1beec88720597c96f083c007522baaf151bbbfc2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e8f09a65af500235ca9695ea3573871cfd51878aa27af95694c6a5ada64587 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b12abafa2259262b4a86142cfffac691d19590 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a56cda079dd3e6c013ab4fccbcea66e66ab07c075d43a14c1485d3cd42e81d5 +size 205955 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde440fdcd3efe775d845f84da8494077711adf8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a238f6d44cd69256baa853db2ed7033d1229b141523fd9a491d16f1cc40f2458 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..488e73b4db867957a45c1279893d7a0dc4784e72 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afb5fe8c9fa5bceb9bd5291d72424ce24cb0b3a7e0f318ba8d2bcd611ba18e0e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be151553d7b12e1491cff8448ba8f2949e97a7de --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a475ba3bde2cc1eb1edb451d76125a9f50a2f4134e5ed3d78a6deece8373ba4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c39d3e693d2576700246de43755e07a3e5021919 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a48288140b7ea9c8d273a2096dd42c082328f3324e68ce8f60d99e430c8648 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f02be5b4bff60f903c844c0eb93af725a2967a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b464081639818faa6a9ab74984371c53458bc37160c42e1b46b398dfc3abd010 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08d2b9a2c02fdb317e7726c0a611425622c4066f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0f3757d86fc6d3e98fc96848e65f8f5705adf4a3dda4f67094ce5d8543faf2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ee7351129d87785389c71889d9550cbe718a68 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04eefb78ace9efba6ea73f52711bf05ac355feeb57e0fb5aa7fde2bc7d6bbef +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..416b6d1df6f24d1e41523b72115c58226acb6693 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2d0b744df11deeb59fccc722c569562d1c9fd239916e322f969f6002b8ae109 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2084313db64f1a3c3578300780e06d9059c801f7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8571ade38dab4bbe84bbd3017716c206995ae8157ce6e9da63d07773cf220467 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..237002092c61e79fb592d1bce0d4cef35bc513ad --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae80d391db2cd7f4bc28bc8faf419fdaa2160da4540a16f97bc4cb1e26aab00 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aa689e4cd1dde4cae58fadeef8693ac2ced979f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa972758130b1e594967fc77752069a69a4baa0ec62d7975c70011c3d9684e8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d853ed6abeaf6b806fe3275d4058bc652185f8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca155fb0003655f929e845699aba2d9572f4bfc57be0a7b77d1103759fe1367 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..811274942154fb1bae4b5868e1fccf63bd550877 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925d6733f781fb5c2346159270ccbbd3aa7f511bc402d232431f2a1d4845c64f +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56c2858ae1db84b1495793076a1ef01705f88c8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51290a9ffe7845eb63630a3675584d9e5796edef340f41b767a4c3dab2b135df +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a72acb3636740431756bff0ad778126d57af90b3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4536666ef264b45d5451886076e0b84243193777d0bd4ca6001e29f024c905 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2584f80c4b8f35a764f51cdf1101ee16b8251f92 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106961e1325977cb86422286026d0a2b20c5dc78126a462650ae606a9cce5870 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1473543fdbea967ae5e2d915c83c29d81560e894 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e480838e7085a8d97dfa34bc7dcacaf8bce49579d3837d2cf2fe61505cf0987e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb51275f29c8becb3e93e78ad523cc6ba159434 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ae1a34a3778df4deb7deae1671267088136f28c9fb8edc93d9726c58f5e1ed +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abda85634092a0e6994369405a32dcc045a0f129 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80885e5cc4a639a621c561ca0b1675f1af29b35d72f59d26c6457111934ddcb4 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15d0d63d5f57cee01c5b4240f3cf69d63d1bb7ec --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb0273d1cc1e20e818581c0c45457defd4fc6b4f784e8d233f8b3d441cc98ca +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e46b2a93075f3282b2943947d08a71f86554d8e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71317f534f82a95427b8d67fee82e282472eb1c1b2372f2bb22cf7a40f0f4904 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c297bb38922c61acb36332f04cce3d5ac298563 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96b192567aefe6a3d7efd9a5933cbec9673d4d904d7d8d8cea592a713f4795e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b25341e08266f0a04b68826a584f02f0ba71c002 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7782ca558c1c68254f70883e4b1b5205037a686540dee692876fb9d54149c837 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa5a9f2c17c171ad31904f2ed6d8006a7d1daa6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5210bde5ca71247d97c5af41334460aafcc0c2fdddf5068935353d3aa56919b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79566dfbce8fe13feef3c38eac7babb0e5283393 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c567b546abaed3eea358042bcd8fab691d8411c19be59b5153ee685ed04c67 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb8453ec5f5f088792e5cf4866f5562a644ae32 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c92bebca315e2949fa4b86fcacaddc38469798e701559cea0978625e15957c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..544dccf1f81abb1170b1cbed51e8124d5af92159 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e59d0b77d938f4ae2970010c0979126ba0901c566764fef329028b9a12d0259 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b9e0f72ef422d234d629ae3c53e7f441162f099 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:155bb4c6c27abcde2abaedcfdb7c847ee3bb60755bb08b0943ba569a9d9a7fa2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40464571ea891ad1adc481e31d9605fe2e7eca87 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2145f7d8e52bfca092838220e65779f07ae413717e72621f349a219b00b0b3a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e22e7d89af0b1f1d50cbd074095d30e378b4541 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55810959b109c4339cf49c28f55f875efcbd6624b79668f58b1ae7eb12005e9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59368c0c1aefd2a37b743d04b89ed3b6fde6d30c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9df23f7a801685a30059c3c8c1908da5b36e9563553705afc2e983a013eb20e +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3647decc5391d1b001465611577a766d3610b3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9eb6dbe7473f09964f1945125a46f777c4962a6aa411f1cd15ecc4d2426ebba +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..122c8b09885f872ac9d1c9ad850bd7f9082a5779 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb20e9f8f9946871de174139e6ab4a83223f9e0067839030d433f21ebbb2e16 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c325291232954ce09e257f4f7efeba1f371532f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6d41c4a5d37fbd94b97a4abcc7699f8044a1d843553803187d8b0a92f62776 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94d96a0879881f69b05afe927fde54f4e3fc0a71 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b77778e26f6782fc83ac4a7643b3306d6f84f38f27400d4e7cd6b44a36372c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3162d0dcdbd709e50947e9df196319612b4c2a27 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea66e23277ddaf53e8d7dfaf2174d973ae6dedcc89b4c21e97b57a028eab6e9b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..718756fe93fd2fcf40f3db6f638f558cbce0101f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf57fa15c3a124038d1b056a74a3f5bc089fadffd2f8431c5e37584b390593e +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e60a779dc2e5a0c75f8860659ace8fc298a64cb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8735a4b2c10cdc999b00acc83c74d2320b7f412ffd09966251929ce004fae0 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4d619e91ffd740f2b7ade43ec6a9373c492cf2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef364da2ca86c1dbb7dacaf8d9e38e4ad1cc899e4616fa15ada3ec3990978a09 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3deb79d1d7df12241487fd3416d0c29156ee1cd8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb854c4ee18b15227bf70301e24fb4235aae35fda7d422e1ac67fcef88169435 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f82db3166ed7939aece13ee6c7f97836cc19fda --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77276f97d0eaefe73e0b28f0fca8e69b83159c5687ac858d5deb6e8ce4ea2142 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56750b584c1808301f0b3f0d653f04031145bdb5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46db628cedafa96173c9dd26da35f719734082f164233996d5b46a918fddad29 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b58e23fe552ce202e4556823453cc45c30d81e7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61cb7f95749f4b0218622758f2b396043357af57467086f1d5bbfea70a8da2b9 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c9d21d7f0cf1027d54a7256e73d104759d0caaa --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7131a3a60b2ce88647f42dcee3337bf1cbfc6114946006ef3ee71608a14638 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..996fe8a045ed0e061c73d43fcf5d4b3adf536ce2 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1620505170e8e898c018e1033730742ff9893c3689dc803e54b19f0fa6da04c6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58934a9f110db843bec79b04bb6660a86ed9068a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39eb50685820d8d638537a73a2fe7fed1018c31cdf58f9704cdcfb6339d844b8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc1bc5139d3df7e33c65401f740c0f6ed4585c96 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43c71765ca9dbedba71cdfed0353f4b66ec60a0acb6e58940f77ee6d5dad37d0 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fef8bdb8bab86d3535d3db70efb40e97f595ac --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3bd435cdec516ff4e066d65f9a3c3a32fa9c837c4d1cbcea492b2c11e81cac +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..809f3c2338d698954cd8733c76876274efe96165 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46f06a5713a09b366db37c7161f665318815f01f7834bbe30dcbf41918a416c +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eaa380fa9d169caff87ed1570f71a79081455ce --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19b7641becd4a4601fbc51db0b4ca9382e90b36b508511a617feabe990f9fa82 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f54bba742702b929b94c949c219067c61dfd2df --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b5338ba543c51827e2439d1916ab61da0ee26570ec2baacfd814495d670bfc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acc5ad8a5ab1678d4037026f638185a49c92a453 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd8203e8acd13962590084c884a20568e8ac6e3b864d2a811d0906be5eef0da +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32beeb742893015c26346d31c39c3cd23305652b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf72553f002aeca0495b86faf728ce270ad29cad3386de3b32b5398025e05de +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..419431fa853f1990f17898935ec7f38f302d6e1b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da75d6c1346c3acd28adca0b773cdf74fd06349f40339c6290cbb65ca5546d75 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a627ce7465def026865bae5f97574becc4d387 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fa5a9a75c755296dcdb384f1d16399f294ef07f3328d0b745ec0a122238302 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a150b04db4897cd633dbe6aedb04896698998c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582fffdf06fd6136ebce95eb1b2aa02b222aad907678d93f90541efc3880d626 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5e7f1d7dca596c9486e87a06f39bb45624c666b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f1541ca772f3e615b822f8fdccfc63ca7277991fe59e883f3e3b38785a151c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72230268aaa6aed4754acb57de9a1a91afefcedf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73976b3264cf02dd454a607a8d20a04d85744ffd7655c335302c5525c3fecbdd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f57f6716c7fb9be31809550f9c9984ea65cb52ca --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6679773613101e06709691e1f80be3b68df305d292aefd70e176b828511c1652 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeb36251e91c421f37320e37827339573e5a23cc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62838dc6fa30812999b5e3d4efb742a2482053dbdf9cf87d5f9aa12f15d03b67 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1ea3f51c0e2809222895c3bc18b5783e795e8e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446a275d8c1973429cf178807fd97577a8adb62b72c3f51a4142ebef7400de75 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1da7fd1e85a5045f9de888018a73891ff00baa0f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f072263eb8b7e16c97179d14892c0b6d0c6070ec1c023689bd0c1c89f49bf783 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68814a496a10bd02d24358201129571e0d23328a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75f75a3d629bcf703103a96492d26beace3ac3d5a7c1b5fc79e8ed268bee9dd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..852ab2cca03b53009e48c58d8b6ab7028cde7a15 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eaae98b0af6d7ca2338e596eb350b0b9eff247d702617fb8e0cb31483c33c74 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..503beb18464b8d8897be723b4367bdd2368a266b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8166d13df94e7e39d02d2202d9063c3120810ae0f44f684c77bc838bd4e9c7 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..036faaf2435e2a76510a9dc18ffc4e4255e71135 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e41b4cea69641dc348d5a09669ad60603d788544c60d0c39f7d868d509313a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c42f772a0d76da68c50958dc4ba105b1a6509c6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50b1016cd6d5f12e727dbe3345ab20a43cff14f01d1ea2ad6ca8e105e89da3c +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a4fdc3d487aa26858d268b5c55ec025b80ff6ae --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83ecb2378ad5e14bbeb38273e4bb177e43f95b897d0bd33f9bce4357d8e18f83 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2be9a1bcd92c2729e70105dd146628408d94baf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992cc4980a3e36eeef414926e28760da35b50c05daa82a15be49619dbd92c405 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b195505505aeaf915bcd8e56c12e4182cd6b3c71 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f51971b86db061aae06305927007892d354b00354b98cbe1978da3b2980ba6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24bbd176eb52a3dc15e6e77e38a9174c11ac24b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3315597473931e231528657a250583caa053a61c4212c47be7dcf81ed35ab430 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a38e3c6ad2bc64b21e21dd5415ee942a4364ca9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db95da651455809c13f42bd9e76b522eca378f3c1b3e8e95ef8a872500abe6fe +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0bedff4c42f4c268a6c1cfcf3608a26e7ebf8cb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e355855d6936c1b214a7a1c1cbbc2ab06486b76f8cc1454eb77b6951c3ebc5 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f75a418234f0a5725f40ed6ba6646d5ab020a59 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6aeca28814903ed5508ef7f1fd3494b509a5bdcee87b19f38de87ccba8a4db3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e744c5480dcddbab1722e6ed38b6cd6690d94c0d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0af0b7d1b0cbfdf65fadb4a4d993587fab415b8e2600c1832848b160e7cc4d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..813c3a03ddc8631f6ff4db330f934beef9ac4bdf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908bfe4d13d165914c14d321b3a9383fd3606e18585a9f428d9aa315a117628a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e65159112092759f47b9d8298ef08a02426f5fa6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79087ae1f53d9bf32e8502ff60990738aa6ca1baaf0ed76d37e1febc94f6d7d9 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76be78252ef7ca97f32225fe32b589007297cc7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf642f0965125f20a356417b633a18dcdf6f23dccaf5994f886d33e22a5c9ce +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4375e4265574a779b96ab8e651ae468d417dd1d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:373578c102da70032d29bcfaf566281b3d98c146dc4b93c8654c534009e99961 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61e7a4630ed593818be4e28d3cf58704ccb6eb7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d5f162eecbb4bf0deb55c492b32ccbcf271c6083b962cad597018208a4df6af +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44efa243dc99323f8746945312c964a2d3eabce --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec47acc563197b8eb4a5f7eace26eb0b67b565decb7de1ccbe27b3ccbcb8de03 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c309a8607f49015257b5339730ee584e0d3a78 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f852665a61c3c8c2b7e1c049f2d7b776f4a2ea2fd56281e5d71dc76c01c735 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4984fc5615025d8793294b59e841434f8fa5c15 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021da33064f68ab6cdd8b56d2f598925232e9b123f118c20d034cc083bce1295 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ac0ec97770789efb4d13d82aa4ea8ee3ade0b3b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee09e631295c50d6993de95473d8e117791baa9bf53e3f4f2e3a35ee14c00f2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0623bebd98900436c024332536ae5ac7534822c7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436659d82db347ca15c49f9159c7f21fbc74ce2f7a52ec8ed935b0115b7f47e6 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..661e95b1666c14b2e226ca78b9116dbc4f0b83a3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648ca7f052ad9be01ed380091f89fccab21a37de9ac1e4155c2f46b7230a1cbc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ea83675e4e02825cf27e70c1df461791db716e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556fd2a19a50c8450d3c1ac33b33720840838bc62f565e4d65b4ef36f9210fcc +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1b4c182b35655cb99e299b709c43899858e0d90 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7465ce3126a071231df7f44f72972603b030076f2776df99613e00491e88e71 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e56550615e9c6578eac582ce761264e8c6f0be --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e01f37b330558591680dd09ea36ad6f254ef2f43615f5800333af025b07189c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7363ee65985f88a2844f440da9160bb9815817f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c879d6708e7ac56fb6fdb8cf83116cebbe55ab560ee246f77201f85913205b1a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7dccefbbe292b84b3b2b0c3e2d7718cb28a0fc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398ea4d4e870e4d8dd28ededb8cfd67b9ca732b57da3db5b05985e4be7fbb5ea +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3f181dbbf8d62174044b14b66ddbc731722d3c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d0fb1d878bee6091cfeb450037305bef76e8a4f0039e60774b2323f61b825c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e44b099d6a78700f443e74cf579a01d5b78b6a1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5701b4619f0429e713b5fc2c9956eab756c690b89c8c17bbd5c0265f2d2bc513 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c1cc91c7f76b94be974ea48e094ddba8648a2a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c50829f53237a70ab1dfb38670bff6384807f7a9f5520075b9bb44ef4c3678 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73aba616d3dae56a8f49423e1af144ce3d884c91 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f94fa76b58fbcd61ea3a925070a476c2aa8e139f1b66f6961604732cbee6ae5f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acc64604562ca9cfb79edd3e8063a7031a2353fb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c1d763a3d66490e4704e54230302ba993952b02079abd9b7b03bdf369afb8e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53465dd1264ca95bb0c7fdcea59a3fb1153fa6ff --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4338223afe92489a8dad1b2cd3280bc17540733ec5e34ae65fa1b86bf388c7d6 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e7ab44bdcfbf4e2cbf229ec5166a916565eb80d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22089aea35f7a6805b3df90a57ab19a90c608cea799d61426e7c5aebcd4597ee +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea0a294bf27276826d2d84b9a45b002c89a9eb6 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e95ef78cb07feb82b180446fa5e19841a41f41612d7b337ec778a359b046902 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e937a2725a33c9e1f6a467086d865bd57661e03d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f98f6e7bc775854d802e23cd2aaa53da961993ef1717c1319d888b982d427ef +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c24898bb6294597323f37622909ac7ce4f2e37 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b91d38b77785c844f0e10e0ab2159306c6fabdeb2a1726a6c2c85e4e270b64 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6cc60c4530880ee31aac6e03fe86a937b85176 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8459799f4110e0681984966ff7cb68a1292c7ebb638787d0abd2c1de645f921c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c961ee1b9a115ef9823480ef6129cd14b5815e8 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe483df92cdbcfe8718126c52386fba6d8592736caeef6942abbb8db149c6aa8 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82694ac12138ca7af0e76d3f062cf169c45191b5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:900beafb7548a3595c03c51871c95d9d255dc0369352895b89c6b5659de76a32 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd9607b6d44575dcaeb7408fab145df930ec7fc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b83c0bbccdc23c104e2d13b967a226f0c07b1364f23d2ea98fee5ac7e19d1e8f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35a35090fd32c98b668703501e097174c55e0e0d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e39eb32ac5cf7a8d4f769ab31d75971a995f5287dfd0f02c75a6bb906d54a8f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe7a96fa93dce8c404ddd9812817d6e00967322 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef93f9aece73d23d934cf32cd11f1c1c36ea44e0701186da2b8e5c92fa6621b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5660e08d33f5cb02f60c71e696d1c9a3b72b9102 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00cf8ce6d5586b419b640ac14cd6b64694a19059b51c1904e94dfbc42371467f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b41c0ac518a7ed60d65aa6698d4850818fbe62 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a37a9c63220ba44828d7993f15f8f7d5fd8d5bd5a53a18950da88e6aef4aa6 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba3ac3ff96de0440c8bb6df91244932218407f91 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6a510975476f265400f3f5dcc71d3e474d4c6487b610884fd69e9c5d09bb31 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dbbffe645273662d35186b017d316ed08ee570b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1856e4cacaee1096d0c199e83736467730249866dd969580291cb8cbcb8bcb74 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af1bcd29a29a5aec81ba04d55b734195ef149c2f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea6461d0e429ae810388285a4d33de692b24e4771910fa41b84dd9862b065f2 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..817547028425e21232e0f00343128be61d9a6346 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3538d7ccb434da686d8a1038d91332af85aa6f80b37201bef97a888235201a2a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c25e4456c5a48df1614385ba678c4755dc81a3b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf70bbb1dbdd71581c4b38ea3a8cf2b549280a95967a0f57005d570336cc5ee6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5166402be0954837a1cce6cdb90508f20ffb570 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582f8ecb29fd8497bb9d0983238a31f405224c7c46104ad0f79096770bfe0759 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9119cdc2f96740317cd7157bfa5d5b069da8de1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcc098cad789470351078cb276804d0beadde35afa1fa0983d880862a3da516 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23cae06a89fec1b70b3c51440d93041e4002e93e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfc4238a616bb3d6415954aa33c9ce39379526665e99fb5483715104605150f +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..674ad00aa172d950c28ed298bc6b708aa9f07732 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7d459ffb32a7251fae161077139a4ec6be178010612113d06da7fe12b2812e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f093611c3bbaebde31f8da5fce16096480420158 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3114ee36c2d510ded6a84fafa94bc77b9230095b33b02ffe42d5b3e9b1a9d8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c268e00127eefb3b7cb0cac45d9bc3545fdf76 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f3cc0ec4a275fec32c447081dd5cad159dc146566782a5df130438fe2d1e769 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..295b1da1b09f497f0c4ce6b12b43892df4d22159 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0378e5aeeeb16e69c9a9d0583e6b7e93a8adf21b4028caf2ab69a52688152a0 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f07119b848fd93479f7615e76736e7ea4b9091 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b93e18f3d7eb9f1a84353e24d25ea1031a7cc8f1b57ba3e3b5d6ff3cb6dc43a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7283fdbc5b09e9480d88b9a204bde8e7e1d57f82 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bfddaaef94bc6b707e2f11d6e9ebb6cbf9b8f22e5a9d4c16975e909bf2bfd1 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3b98d2e92431e02c6d4a7237d9a21d97913653 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f121c8d166dfebb3b3a75da24ebc5af55eed289a2d1fca5f4351dab1cd32acd3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..811c23e6cb2d20a1b4ea719cbcbee9a6ea084e07 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb9a4050693229b0c04a663e1c240de70cb75cf89b4d037077bdac2a28c6aaf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f02ba6012b7c312995cc6a3538a5b991f3ef142 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62865e5bc0f7452c089fdbbdcb663ef7e24674456b3a665086480be8f1355548 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d55d4615b57b97ce070633fb75ea406ad26c9c9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da85037faedcb4123c48d35d55c116a512c3cb37a763aa79697b7e5cab5888b +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5579ac595a74c896f52c7cead50e95b9b524eb5e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d460d2142cefa7251e884f396a6e583511d53f114eb2a991dabe26798cec6ef +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0950b4fc27d49672878215fe709f7ed570543bb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ba402def00d3fa5660f2fe2049120df60efc618f3d6dfd514c0a6df87c4511 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ec87c073646b4ec06230c5c7fcc08a2b49a9aa --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08dfaa3c7bc8c92020ad2221fba5b0bdf139ea4876aceefd5f6b92d7c3405526 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d3ce76aeb5a6bc6f9538e12e21020bba985eb48 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e5806ed2f64b5040bbb2bd456fe3bedeab3b0ce53416d5cf616334e84e6298 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c48ad6acd2c50ff81322fdbd8a9ac8fd166aca4d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29232b77b20ae016a97da84cd93aa397a5549dac2c9806705d80197a5d65abf +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9dd268f301690c5f3870a9518d914425778c01 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f2ae58e31e4f7b82122d6c58d795bed1618471e62272feab357cd850b982d9 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7cda206d0b8bafe16daade168cb3d9573db93c3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f4540f4c71e0edb5ccf2e901334a391f2f63307fd939d2b56a6eb519d54989 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46dda269acdd39e7551cd9925c7fe59e75876ea3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16afcaa5b46289edeaff5c013d01beb9a2ee8871c143694cae833d07bb29ddfd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ee32cd3b5be7ef110364ec3c8436b352424b24 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0e978fe5861fe085446d85f0dedb844c6dc568770fe02142c1ea7be11f0754 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46e5c75855d48ed042f492f1c433408ef4b95819 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad9de804c3a9c3864e3ca08f9d34d9d4a123ae76b4ee42f43df878b1570295aa +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fcaab1c967ea28b61d3fb060767dc6a00cd389 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4646c8b8a46a9b43ab1ee5fced63a5924b76618935d9149ebd8660d60085a4c4 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d9b64b4d2167674da8c47d2e9aa4e00fb6c484 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58db866e9ce7ab6f1cf404a4e6297e3716687d0c53ab127a22b71cf8c915a60 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b57ac4001fb6366a673aa5400fe7ff385d968b80 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91cc18d9fe311f457d2386012076590b9c132e43bd9c448358f8e2fc4c4d0483 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e17cafed28686e77c369cccaf1150187e126f62b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:976fb976017bc0a65bac7c1760ba725c63a5d6a07473dcdc69f90b8cf8424f6c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8c6266127bab35478d98ace6584f6d470910ed --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4e4b19a82a343686259ebb7baf6ba8ab8c4c812fe7830ab6b94b43a6748700 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a979241caae05692f01c5a71fd23e6cc52a5273 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051a9ad85f56f10cd892cd6a5a1780a157aa0a42ee3a1f6f3d2b43f58a4e3068 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55829a140db924614b4e9705ed19e4254235b629 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e26458e66fbfd1ce413a61cf363fa57b2590e387a3190f61b24e5a6ae4aa17a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f74cb60e8e27f141e5c468602d8df412c41448e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed44a2abdcd0ff1f8617cab67ece1906144e30ee779615702f222994c991239 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9169726db7cf64bf5e17edbb312cb6a94c13415a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75415cbde168918de48f28d0b787c925ea3da9de702e7e50921a88432935b35c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75b9fa29e02f56388c197fcf989cc1e22ee8a7f4 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949a6c779fc6e9bb34db71f5ab62016d27b1fa7d64d5a72ae3c6f9efcf73905d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31c04ebf67c65989d8c1702c46593a533af6729 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08b4ebb610a01fa44e42d9f8aba29649e96f925b800c0dc38291bfdde8684e4c +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b279249aab1b14968e68a13f21169e2ec33a8e88 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4bc94aabcccb48491dc023664e49e095cab3beb7be14ccc24c6024cd62ea4d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd5b71e38321ee8c590fbd0d4406d5e91db034c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1785250f4de4c120592a569317d118a7faf1af72d492ea498b3646f469c48411 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09fcbd80d1e837ae25887542d2c5c4b373d7285 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa8c0871588e50da87638413f045306b95141a90d8dc915571e7b894dfe48e7 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97770ac9c5c1657fc85dbc80e4ca5540a4819cff --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c78a10966f69bcd141224a3faf5c2afab662ea28f0315587928a1e95d0ecc3 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1570024308e716ed46599413f97a21cfd77469 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f6b87bf8430dc907e2e6804918049647f0374023aeadad05fb61ec539fb1fd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56fd67a73cf95c282591cb695058475d7e499e42 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cabec9dea72476b12c55a5714bb2a1f64817cf182ae530836727766de31e0ec +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3b16b16242596f8ae6522b61ffc40f4842ffebd --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcd30b5ea5599833da168edc6fd172e881c8e9cdafbcb841bc2c41c44ebfae1 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0881320dc392f2648814474fb409480d696d514 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde02a2102ed07cc1c2cd488c52f8186b00c3489baa9b5e1f036dd72dd4ff36d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c67146d0126794c3455d1a6faaed2e91076223c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e86ec053207b15df5add23696ad33907d732902e32298a028e33771e9c48d3 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f69e5c93dcd0f5628359c6146ad70e5a948f420c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556a6d376271382f24422fea89fbca1a1fdd9499f26ef488bcde28626f310035 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..687f441681ed11cd714c054bcac2a6a00f1744d7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc599de3c4c9490ef72f091edb5de6a32441425ce74d76497fae609712df63a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eead277ef355d91b9a2512f672cd1ba234a7e3c7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013f77112434a24d6b905ed5db4c13f927faec6aa38b9fde67ee3c094ab74d4a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3bcf6c3e67d4a931dd0148839ede3d3b2bbb677 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dcfbb965d67288e83694c07f29268cb293659a8ee290a2ae304715610c4b360 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e305bd708d6b809751f9d19f0de3bdae9d81c5 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e993cf0c466701b1f299300ac3bd6d08ef69a71848ab7fc180b3f6e9534202a8 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1d07ed4f7a22d3dfe57772e8fbf9688877ab45d --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565c0a2fa65b30dfd8a8624131fcab2975b7daf23bd84afbc6057cee43e18acc +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6445af984fc14316faf6496f36b00b54480a8daa --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be7193e82da0eb1e19f8bf455ec13131260c1ff35bcfc591dbfe9b0f6756b0b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f1ddd0d47a2c47489f28304ce0271ccdfe417fc --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7b3ce9225b0134c5608ceeb51a797eb452e5c2e665018cf1593282c6b79a291 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a52432949e387af8013393bb2eb85d81bf874f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a02eb94f86abdabca72c284765bd9abe060803c43b01906e6ec6db9dd4f0c5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f7304b8055ceef5b1eede2fe97a74e268a4966 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9bc1dd7a6687645d6358845cb95df7b1b1a220c7570dd328d47ca5d3734405b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..705bd29ac81cabe35609089141ca6249df301bd1 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bea8a1609d2c006f3e94ef043323a3b0aaa34136921c38f68bbab5c842d0fdd +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e834133abd11a288cc2f5e39e0ef1df6d00cb9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ada2dda3667d9d7c963779d312bea24a9ab00150bcc0a6d3409799b86b5e086 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a61e55ed3f2aeb58f2d6079378b30eca054b5e3 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0691a87bcf9f8ff15060d24686a9d9b33eae7e5aae15b3149d3bd610afce4941 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e78d06f58dba7c56233db2e73c9c98175acddf --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf779eb34c394c76cda237d1bb06b98facc3447bd14f94a743072394d79550d5 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f56616a90e2f1a64110f681c7ff07f58598a5c --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5b205d3ddb526370be9e804747bbe20ae232acbe4462947a2bf42e0f8b8137 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d742e9f6b10d9f6bc5fbf62f60b06b60ac3b602e --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc5951197f46f7df6f6ebc0968d683d3482a83f8051dbf31c7b7a1894dfd31d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17a080e0eb986426488abac9a5c10ba608250d94 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a5f6d9f18764dc2d800315c81e558ca41cd09af22bb78de5aa1d76c5d3246b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b27ff2b6586e2c25251d594319a25c052874e70 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b67eb2be99b455b17570d1fef061faa2da968f854a2eb04e5d65b5141b50d1 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71f2b047b2459f982729862c253e4677a1bf054 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f76d721ed2fb9869205bd8698b86aa85a19f5d48969833bf21f4c5fe0e3cda13 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6979ecd9ff67dfe33b55f616a5aeb669be0473a7 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b9fa5354ccc1ee877f0c08ca8e20622cc8cdac343c1de58130a7c680577824 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a4d396f55832cfcbc175459ab98bf4f906cd46f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97043f645ebf839628268e27e9c4c5e7c124d3cdaa81c4edfd20c31106e9a39b +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca3eee52acccc9fee04ea3e70768e24d13eb3c9 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1d312e1e2b0f4f996224b8b35253ed1e7c8e2955b6a2a26b03ce2375817e2a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..843c1ffecf7c4fb133b0a666fe29c37b9b441387 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e47aacd5e57349800199f9c648fac0d1bb80f8089a21f62e9d9a6ecce4ae38 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..608d1fe69766edc8cd05390f3ee7c069f17d486a --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891ac52d76b8632cda6831fa2ff272e70e1e242d2c91a32f3ecea79f4ad68f23 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c7cb1f54b2e6a6ef27b4c62663acc5093944ad --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84c0069d410dd97f378c9c0b2268bf370959656463541f9bfeea5fdde00e24e +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..501986327af4af029abd683d3f3f11f406ba5b82 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d41491dbc3824ced9de92ed39c6d8003e8052b072c6b836069a79cbdec17b6 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff2509f13efcfd01ae9bf5047c59577fa694228 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de36f9b0f5d3aa6e1b4e54d1f2fa1468918c8f7ba23118efc31989239e997ef1 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37180f63d7abb3c82cc362231b8b347f30352274 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21d5b6b96df9aeea7bf4c53d87fb5966854abe3ed5aedb5ce3f1b334d0e890d +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b78ad94156f0bcf5c3db550092aabc18d989c63b --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292e736f9ba2d0202c9cadfebaf8dceeeb89fff6e943644a4f780ff4a24b5827 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd3e47d531d1acb5db8ae92b25b61f5dc6c94fb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422feef8141c45fe9ef65e05b97e25d52ff14e04bf4ecfbef90d279829a820f3 +size 42115 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..544dac5c0e6fcdec1594287ad41b0e6cc6e3a4fb --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601d2f9e60c204c49a0f0d551ff5dbb0e4b81512abe9ba2e9396e599d6174495 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34bbbfe92a5207a432bd5dc3a536360acc774fad --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b382a194ca7e9c5ac64f999f4e2f3e0c19d25c783cb6f762a1824716ceadfd43 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc606316aa6bf2590611dca1ad730abf0320162f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d66d96e637aa6521503cc71d3d5542dbffd6816f00ec21a9d718abed6a5c2a +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce323acbb06f4e5b993bdf2dcbe60411e19a081f --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5477c4c063c37e1244a872f5c7755e0744af49b0d7aee496942d58251735bd24 +size 11395 diff --git a/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9635cba6fb5b59b824eaa23b1c47af3e25e619d0 --- /dev/null +++ b/params/phi/5/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f7dbe7fa587dd78fff2bb34f7acb84d48c56859f25cfb40fed857b205ab944 +size 11395