diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bee9fae426ebc6b3937dc2007b3002f989b7567 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c5ddb4ce569e2386bc734b66208dfefa3a05adfd8381899bdc065e9e3eda94 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..655662c2071d1171af7ab11c4cceeedef39b0651 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215778505ed325643e60dc1e131eda38c5d7c8735c7ad8ecafea17b6ce214111 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35fb33620d9178c4ba31539e0c722ad39cf8ad3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aaded01a5429e63649b26b3345c7a92be50200bdb3360c8fe84c9e7418c866c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5146ae01635786b2a707ea0fc7c167f555f5ae1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d24a6cda5b5055732900bbfbd32d6fb67b6dd610976a6ce2cccaca922fc9c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92e8e0985c3179380d0c58f17050202e7507b1fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22fd388fdc29ba5d7c6bd8925a165fa4680dc2634c2eb8c569ebfc3ed3f70a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b6d72d781168be5d9f48452e6e8b8ec7d227f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4b6f99a181b562f97d46cd0fb8141f6bd103f635209d6fbc290e0ea26c1ae0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..090daf0e2cc122b95b2a84261a866ef6582a3016 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ed43c565dc73e036c1e0d71b283e55bc4f28253603f6b19b90f6d26eaa93b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..566bb1f61a6a2a0803b233923855bde854ce94d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72a9a10fb43c9beb5475a7a4b9796bb9d0ed787f22279909f896c64bdfda82af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dd69bad95d2a3905d6bba85046cd8d8172c1f8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aac7803fbd58680c132d111b62642b961361956dec22de80bcdb66d8b580142 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8445c4b45b22ad67592a6834e5669d6ab160eaf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7309636e77e2159c9f78082410413db689a4287a06147067d7c8ccfccc615b1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b622f40185861f686357ebe10c82a7152a39d59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5e87485dd1e84e69d28e5f06beee2abbe34dc72f641b610b254624856058fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a737b8d02b913a9114de2cc2e1230b433afebba9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423ccb529b017a897b1dd77b9577390446122bc173963565c50bf7a84579d4b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e161eb415ee52a7e49e88c92653d391482a13d11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef352ef3dc04af4532570195fdb32d1b9c9d22c9fd45a35ef16b075765c6b1c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49657dc586163c25a85ac1488ec8f78c2ec01995 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a249705b353d3ff61322f5c73f45c5d1b6bf8669806035430260c2436732b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a05ea7dcab9c98382721b53e26db59dd40ff6a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89aed12ecf1297be0440fe757ec65c3caf8efd504b638a7d9881c30837396ae6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c13ffce2a93bfea6b1c73624e9649acda632305 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc2dd1ca72d468a09abe4373224c92a92c537181a3b7db741adfc0107ebaf494 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40786fe52f2b6f0fae9efc81b8ebb0c69e6e30d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741f62050d7b981575232545dc3a37914e22c87e61ee302269e5ecfbe792d58c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a34fece475647bef1324f11bd29dd0dce0db636 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585aa3dce6206056caff4a29121250111ff137d0383fed0d389db6b595028552 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b1e66f849aaa2d22a995f24765f308b1b7772c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977f686229ad42e64aa76dada78ce2930a33ce9cb5e8b79892b0a7915daee779 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4635169b4de8845f05374771e2078f0590d02821 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04dc5bce2533665eaa6d23a0e5fb40f8212a37be2a362d033a7e2f9a6861f19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64055840a4ea92b6e86c22d64572b904b904fca8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35196c94476d75a92a82f5941e265e7e3b5bf0d688acb19d2cd27ce4b9e1ef15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5490bfe8e0fe5a2cbfabfa9f752b52c6bf8ccae7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:351ed68a600d5b347357d452b86cbf301726ff9ead0d21e11ad49cd2ba084506 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b52938c6e05b77762470426ae81421f0be7d655 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a669db38cdeb0537ae2690bd49964dc9abc909e40af0494452c4b17ea53dcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bd918d73a8bb2e0877026f810002c400564cc79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd86184b640893bde9601c71eb9eb1b6f8346de6bfa9683c352648df3032758 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db683b7e31f0c0fccbbb436ee2cf14424621940 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d3090e0d2ad049523b37ad3864260982bf2dd923bcb9c67d60ae2be914feb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77351512b1fb721ea4c766f2f725e000689e83e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda630c8cdb2b9f621322bf2b0144974b9e1bfc8ac5daf3d9961a870aa83ceb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7f9fbbb3805355d22bb819135328f82923412e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e253c43a4c720421345a62a9ee464316d7b313deffc7e700dbf16e0cf3a9e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df80fdce10a02bf86af85fd9ff6d977f0f2a2e70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e0066c31be32fc96f83e9b7596b213c56c657e1a64010414c52f6c783fbc4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69330dbc1ff6c0841b6319720ac2a5a6a0f41ed6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e9afbfef35751dbb36b5605228942b1843ecf5776fe0df4cc0e8ee11e4242a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f234707b150bfcd7af37e09f1d93b99e312ccde7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf13f0db81fd10d231213d8e53858337c4997da27e24a5fa46fbf05650e3838b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..baf638e46d6ab2cf9662f791b9456a6d9e21b724 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d74f592dbaf2a78b7134b196f03516c7aad8bae49e1680763c4dab45fdfc55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..370f6d24a431600a51426ba2faecf54b45326157 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e826621a1034aca4ee6c5b440fb5ce9d2ca422e08815f4d91f89aa80af1638 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3445990e05bad231e2b0b293f097d485d14ffc08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f3c7e72a4f130851dd32347036d4b53be235c5df6dfb4fb50bde8b846657aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3d826fc81db94626977633be65c893c1798182 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b40897dff4dd52615b8ad920cbb140263b690ad287a83b5b6ea8a8cb5dd72e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd86eea4a7229c18cff9820d9242140199d7c84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4076ccb551740680adcaca9bd6e42d38cf0cedbd416bde7a3e83818e41f545 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d30dee700ad223ea814efefcfc56a4df40abaeb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e776009dd002aa79ff4244f93bd3d8617da3f6180c0083daf9452b2c24b85c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac9d91001f8e7d743833b8006221de1d205f9a6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7e4394d3522539e2426b932367e304ebe46992b42c9373b35512d2fdc75362 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c75538370eca1dda3a478cb182aa62faaa231e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf9e37785f8f1b05948320d4df379eebb8164ec8fc6f6cac46479d1c3aa91ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe2d930f34268954d2e1b00b541701493f93eeb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8bb7ed65e6d9560d4ffe276686e80f328e4a53f2586ad3034c7a021b51af8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eae5736291b878d998b14c5e460331586524e8d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a36afdd5923c893bba9d57b788b71b846a5abe130b891c14d59ae452658d8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..045d54b39767a90c0be5e7dd9cf0d60d38d4fd5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f9bf4996f86066399fda95b32f0ad3a2e7bfc8d685ac9a15cb0ac98e12dc48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..672fdee14b0d22bfb8834d14afd42af3def8a368 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba9173ae067a6e5e91fc92c14702a8183d788cf61e53aabeba5cd445de90d25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..569da7d75b74f5a5f18f1802b000997bca1149a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21fc8500b0afbb73d6e94bcc9d7a31d67d31af87324c3ab4e9a72ba3455d3861 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c89c0aeabd6b487d2942dc84fa31073e21af4e2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db806e6062979b4c31dc356a1bbeceecab3b47ecf9430f24212c7c01b0425923 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4fea742ef05afd88a35172c480366ef09d01c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66044dff3cd64733b1a09c0da645a85625ff0d4a37c96d39878bbff58a6aafc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f1c03af7ad574ca27ea4114d4e15123f0639459 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c7300517424735f2106b32b87887a6b7e6cdd7b260277a68e0e29e44fa3fdbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c83badfb0ff731a266dfe4840e07609b569d03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4708cfdf5964ab219dbe7fdd2f30de8c0478ded58b8a2934ecb72f828cfeec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5229e75e3e95f6ae5c94d6b56a534feeb3a87d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfe09e0858c7969e8a4aed44cc6d7a02801ec238707bc5c5565c855a10c0297 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18d3c1e9c954ca4088fb804dcdce7e0201d5dcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710fce6a803f1aa7f46f362e1031541201db6014ede137f24571c2cffd4bdac4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a584325cdc3fff9841890febc068121085d441fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec851b663ea98b87d8726505ec76c180a188c191fe17e581d54e394c5783f8d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ddba9f11f3f57daf9e8f661509de99b1b6a654 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8234c1eaed601fb41ad62336923085830600aee117e030a7f1a2b01fa9838a37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5decf7b9cd552daa5457e5ab732a5beb9f379b4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2978153877ae6d67f349f81bb6fb1bbb27cfcf96a431f7e6e2969ebe39601c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7941ba39eff673ae4c39325636185dfa57725d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d190b4463ef1ac7502b7b720a2702d79e491c182b9bbb45bb3b88464f1b318d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aec09af504e0934bde4a8215f63a2ef14773f46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec179a7ef6b07a0f5a5e3c898dc4980f12644abeed9d81b2ad3f31348a72de49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0fdc7b3335f3e836df1edd5a12c4e4751f31ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a44519050a57694e560a4587f17fced5a08dfe570d91bdb48f8852e51bc3d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74e2b6e1aef8efdf9247f86fc84edda562fdc47b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:004e2016baa73d4d4b22df892930c303d67395f4b5981adb45283251e76f817e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..946c3c028cfc2bc00313f8c1c7489139224ee8a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dfb37344bfe6a2c179d22b9fa7a266be26e82aa6fd9ab9ddd91b9ea2fce40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f5f5be366d9ff3737a81682cf7eb507131e949 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b19ea508abf80e987a6a980201b8d2c3bf267d5c13aeb67209af6986150115b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..573d6149ab60b1992d5eaea1dae23e6cbb804106 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690de9291fc91b9f6e91c5b288be5c7256d94782b294740c42d70e83f200fea4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2487171c9c313f57d43bfe2b51805fdf86bd451 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beca4de9c748b6b8b0ff40d841197c2bf89735a8c7e740b59966bae84bc718a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afd8bb1c3840c25e8f1710359fdb2d9248336159 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5958047c9e99e203fe0d250f571017d8dc72949c7d1735c0a63de848faeff393 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc02f3ec709cda035c2ff61e9fead96741b89386 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:802ef7dd90dd7562e1329386aa05e56873cc333f2743abc3a76c590b6b2548f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..610dcf47a7d2c605b98360a9e5b00272656d9422 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3469c54152da642052dd87cf91b46451e81d9a3ea4d8ebfa931fb643b657f598 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..796690a10aa1e28a5155dd0666a8ed64cc00bb98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bebee97279500e6c1d2945fcf2184e7b0e3a3b854f584e1c80dc80a398086203 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a377ea8beff1f417d669d56c3beb4634707e6e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a0271e591b8685e2cbd4f87fc107f62c4079211a563f292e8c331c8e7b6cb4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ff85234e64fd72a06565e6ca0a2fb4aed5d1e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cd702185f7cea69881e7fc95c2b196b9fcf6599b45f8fea1f1d85b10926e53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1664418d42924264ae16d626fabcdb8bce784b5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf30934915216fd522249bb1e29d62a608ab68ce48e8e60a9f0406d5ae65b8bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f91b8659de744f8835a81efdc513e81bf06dfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcfb20e73656355deb82ad673e6a01fc1082c2c908296d36c31b6850d65445f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..010bc0f08c80dd714209f06198279124c89fc83e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24636e9eabe88e5cacd60ac28ed2d9e70b6ca22bdd76f53f6522fa1c83dfbff4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..094b6e3a384929f2e4600ec9f8c63ece83b58c84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cbb926d578cec1c6ba268f3a54641ac7ba3f7eaa06a500073d9c5b418c6c766 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a237081987c9e544be1501ab1d525ed1d80e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e443de45e7a60384f66eb5686cdbca3f2092271a4f1464068afc534fca0d49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80b5eeb48702abb86f7bd571f64558f25466d661 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae293c8dc61b9c29cc647bbf19d2a248ad1d3c9e23d0ff9d97762a2d138fcb3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c465726cf43c20ccfd76b33d5c71b71f70ac39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa69acf441a33598be452d537d11e0b266d99004b2ece904654f0d12f83d1ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de157cb626eb7b261be8e84f9b8513471d4c0a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8784f1561c4d0a79afa79970d4e66c640ffb2e9fe2920bc55530024388178a8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe150ba6b6ad3321926ce714f6208a60b9415bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a55056f50e82628b7c4bf35a7fcf9251219cd9ae0dc773ece337fb6f6dcf04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..992dc9517a8050c5859acb3354ed31cb52d095e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0688217a26c24031f23e39812979f286f7551a3b0c3129ede76f93da04ed88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd1cba611cb8e181ddd8e63c465b8c419d3ce33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376ab501b0afa8c49f425cd015834f55dd2bcf8b0755cf3de0a4fe7e1b46a69f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6043e6f0ff8987d3541eca65908b2db73e46bdcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7dc81067053191e65f8bf8a2d81a2c010471d0ca0dd2324ccf42b93cd9cd3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d4fdbc2af2202beafb824f6e58b799152cd2e67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6925fb3b10786d958935a3554e93725284dcb8746613359cc172ea8ff16401e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a564c78eee70302218a65c9529e51ee28927a534 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201da797876443a91a669342c9593423ac9ea070ab38c67e68b19ed458fa065e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..506e66181976824adf633baa1f260d3ef651fc65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753000f34cd8f467d90bb3229cf934f8bfaeb5e3fdc9b2f17630468fba47e1db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b9de304527495226a100b88475c983751128674 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac5498ac0654379c1b8c7107f32b040bbe8348bfe2b5710501411f634f422f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef5deb214a57c584b72b593e08a1389bd99774b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb9ae2278907998979ab4b4a0fa39fe583a33bedaba0a07a61d64cd1bdde198 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6452af9923e0e29481eb1f8d18c260e5f8f0c327 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ddde97d1406f0774a95d5700a5a6aef2c453c9f1dfbf77c96435db7a8bee261 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d474b4aec206c164c15fa3a2d9d1585282fb8c78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add5ff8540ae4b1f14febd11872b99c04f3846523b90423e36307302613ab709 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..014ec0fb12610c32346877e81a14d388d8ac9e36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90597e09c6c59ec17c0d9e5cc1a28fc17054674517215d33aa4fbc103f36fea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89564d5730febe9df68131e4f357e897e36ea482 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82da4421a42f98aa975b78317a6e01d6af6ad7de7a6c0bb99da58d3f7cf3ad48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2179c022e3895d625c6cd4d86d23f146077262 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e5a1d4f8158dc0b4c6835284cb31b965bf1661a6201b7ef889d74cbc6828c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95a8b775c21e418deb17b61188e12b5fcf1cccb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7147888e7c9632a10f9505cdede8344209884b479e9b2ccaa5688423c915a223 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00392dc5c7c5b3bd5f83b1fa9bb2ed43d2cb3da6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9301fa482be022251cb145295f582326ba106042616411236cd2529d20dabb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..341f57523c26c6e42837f000fd3419f828a729ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621c6264ed7fd78a688f6acc2bb64da037f8083c8368f701771cf936a017ed6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ac27d2c246d6b5acf7e1f24df302ba7d0f6ab8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c963db28885b7f221f703503f07fcc5c944232d2928db8e7de0d3899559e3581 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8059806138d22d597621105d38b82ddc0101c40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b810ee90dd0517b6711317c13425653cd388f460fd2af2a8c8d6d4f0f9423b51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b9e5ee3cd474fbbe8868a7a60fc5a0b9876b217 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f901eab994a1467129e9c069499bcbf2d28631ae803f89326fdcfd24fcb66468 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7844fe7309fcd554abc6c2eef5869e90aa565a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede585f2c2e42a780f22f3de399aea254639dfb8aa08697e18771436dd622372 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbb8a6f1bfb84c80c814347bb0cb406ca4ac43f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f8ac4b636b9e72ffa9680bf994207289bc8a9e4fd8e700286c575a4994c33d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1816244ca7b974e29bd5fb8a576b1eb227d870fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c11f4d40dc9ad4c101d50cdf738868b4f98978ea36b092758819e02cb6dc7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36f1a98b3d2396e954a409224ef4f6a2bc6375d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f5bc0cf7f59eed09fb8686810380f8fac2b1a0e8079d5faf9bd8728c9eeb40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6cf5d6ba4b27b860f606399f019c1d07572e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ffd6303ff15d7f337b034fc74a576933629b65525e7b5c0a32f483071603c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..696ed6575042385914e7532e949598e70ce4f7a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c12f1059a39de2d3c9dd10c85cbce1dba0da93c9c181f0ded00f09bf62a4de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a350c9bf1b80c6e112c92799c340067c151843a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5627c47f77f82f1d1696c0be4d3b794a9b101d4ecebfe4572293acaa1d7fa371 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2964b3e46a9c71bfabadcae8d30c26a966234ac7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3ffd68d577c5b0969fd982b1c66850298b7a5ba164eff00c289264c21963a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2fd02f7f41399f3aab3cb2501c14fa297cbbac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb54fa70d535e828be4e4e709a7478962267937b9e88a70375988777ade8979 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb33c4640dde08c27f602e2d65a8e7ebd2e12ecb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b032ace62587662f8830116bb40f91f867e0d4a4bc8d5d5972bc71f7857e47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78caa0e45bb86495960ae3006bf101cb99a1140e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d0262f83ea621d7f9b85572e0d3132ee92497ebcb1e50d5428e29cdca0d790 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39605cff84b9e235bbd0408aa6407745adebb3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e35dffd890ddc6a4d972987f2b78641ae89d4f02c6315e4a7848a11f157bdd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e3690752878ffea233bcce080aebc0cb291330 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced728e9a5944fc4e7d26a9fc3579e137b99d997fc62ac69d52ab37e1dc0fdc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c997b1fc7603bf9163c2cfecdd7fe32e20a7d28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed947d06d95b36dc99b84088b096682b6ea98d82215ff9b71c7aebd4ef43e8e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa183d4fa312aaddd6f613c5f9152bbee76e2a88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2a2dbcaa6caa2d2a0b1cb0093954a4dd98147a06ac29ec6bbc43cbf9d0634f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d07a35f216b6e33f32e0cdd9c690bd366dda1ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9b65ea98c65f258eb0660392f55209352742563e65fc90a4d54e6d7a94317a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00295a0142701e9ecf7607c44eed52ab6e6b5f6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2878084d6323a36f82c0c3b216ac0110e9bb3ccdcdaf337dff88851cc71e6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7fad4d9b66b3faaaf001120d64c3440769b652 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34c7f507d18d0a2e20f830f497813828d9d40d7dcf14c4c08a68b72725386ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b478edf3fdd792053095e13d2b9c8936054a149d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32cb1c2646625a542e6b846fc2107689e3157f21a145be632fb8fe9cd2d947c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc96fdcb47f358ace9c14c55f9a99b25ab61e6d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d10e3ed8e3b918f7e8f54aa2932622008c353138e5d689393b222df662bb740 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec2a67e737fe731f71f30dc9cf885e900741f56 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e60983efa2eb34b4b1cb3dc9b1959c5b0f2dab6365f2a591de630dc3a500510 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a23361d7e67459d74cf8b23d051a38e4efa2ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2cecd920830d40e4a6548748b1c950d3863b39eadce0624305e8892c494f59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdd63f5034eb7783a8573a9557b353a92b4284dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55dacdfdc08216bd9fbb6c709342d2e9d42939dfc54669a7cbd2bdc464002e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c3ccd002a1eb0f0f9fe9e1cbf2d470c9be05d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ee21b5e5235c1006e1fa4308b7dbc28de06f53b1cb2b730437baf82f1391ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4781a84faba2bd19ecc0d6cd748f6a604b319823 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f060e932ca4a0349c3611c66349095eccb24b2752de5988b3fa6481fea49752e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3fb35c8e3dca947296ef631e85addcde016bdbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31154bffbc5bc053d28f56d81d125106fc15ae93888c19a113170da82b8fa999 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..210e8293a8fd05c987832efc621fc7d37f47d121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc510df9f1f40d0ca2a334f438c54a5a91d9dd380fb3c12c5439e38c0c920f29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb49c2d4845544f1ee135016c069a885513858a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736ffc3a280efdbcfc267cdec2b3c9e8ec6d69713cfff89fd7fb1267137fde8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8be377c35b79c67a4b57042b53ec2774989e1cdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03094f33297c09b1e1105731191b26a62b52034d6fe181ea55119dedd089153b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cbfcee03904dfb4576e1ce14ca9f014720e7ccb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d565fb1233f38ef8c6134c3cb51fcc147ac4b92cf24036bc96df824389a4fc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecdb7e3d7b49d89d0eb6f13aa4838934c0e06eb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e58305192d10c61f24e269c0a3a9c88e39c74aca56864846600778006261b70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..beff249a37868c6f57f74f433ba2a92803887827 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb44c945f6f6ac276955cc7932d0cdf8b6d64a34c4fc6bb313c50ef310e87b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c986de31b6ce22730f194e02d50c48363ec5b2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7fb827d8b555dfc2e55d7e3f0b1b6ae43321df19ca07b463cbc072bc01f93e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8fb1a2a1bfabf383e220220f63908aa25d3e0fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc50b7403446755a7e4bcb43742d2fe70bcefecca6542c6105233965a109927f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9c7a71fb575ee6f3993e62bae1ec46e512c6045 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c95a20bd9313c9ba9afd740a1ccb14d9995fe8865076ce9206717f85165380d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92db21979e8ecad3abcb37de475592b0eb84b732 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fa9832e64fa766b61dc2ebdd1da57f63fe714db117da1ef1aa8d0ab3ee3149 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d150e8649052c3bb5b689273615d4da231f3d6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf80431d914d05c83558ffefacc886d5c06ac68764bdbdaf852c597fc82e539b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..506efd49b053a222c963cda4ae236e633944b67a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52c9757a93f9d19477bd37ecc954f310bcfc124a23753b021c0dcacea63b4bb4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71dfed15078f3a25de350d2e9127f5b894f7348a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba41d5ca7142d7c8add5d4561a7641c93aaa7561bdae2d834dd2346c34b4ae59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ee32e732af2fb194b289501b0cabc725ef42f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea578617c603eff0c19e648fc0f6422ce519ff2f653e7c185df2779bc6f126ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef2a2e64234ba49896dfb5c51a9709a7189506b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2543db8f2563cc4411da297ec5bc69dcc4cd47c866608df8c95e27a301764c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f62d58d7d672019f0c2d62ab1a26b870db9272 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa678b88340647210fcf788602a43357a171bc7fe4d82e29963a847f1690e7f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..205904ad99ca158e9ef6b53e208951876173af2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33d5b8560a38ccf40e18863bd92321e06300f5bba30340ebd19f36e6ca07147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55329288a08de3d4bdddb7176b9de97135be1f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979a51144e1d16321d39a8e348a27984948a92ae4835598fea86e039b26ed5b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..377df0056cbb01b3425ff547709453597bde3f4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c01e22ee03e6f8349563fc09ab5d779cf9b650a73d5b3cd8f9e91f14bc736a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc0c31dbd59857dd3d601c374fa9f677f308d06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f04aaa4defbec8f8efd19bad411fc5a01900710973ef5dd8daeecf9ac07e129 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37f4cf072fd77f528556b61f03b0dbed4ea41418 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e517a60aa8a4ff32f482a1bade7a334dde5651193236bb5dc2ddfd2d372ddf6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0336cf8cb24b849b801a9ca99de290228c005126 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61d072f40653572b56ac203d69d2825e8c11118bc7f566080f4882fe69443cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55adf86ebd5a0f79a8bc69f731af130a464d316 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ffe5802c7c886d526d3bae70fdf5543bd1b4e8caeca92996dad5723413bc8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d337368caff98973a263618855d2ba055578f61f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65744ff3b7269e29d4dd2f5e24101e9d33581ed31431faffe088984c7b40c82f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4c69d21969c60537ab66aad7ef6de339c6a1ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b60cdc69e71d8668db5747699ff3fa175e980e86142784ef4de115a0390f18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf8655028f0740c2c2577c5aaa60188db307240a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3b7a73fb61b35f2b955cd4070e14eca86e817d3ac7b62d90acfd885ce771f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a50809255bc625bc3017baefcc621a8c6fcee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a92e362a60516494ae9e66ae8aa5a630e2fc1f39753d19b4cfc66863cc979de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66f8c50b76587111dc2e6cf9f823438acad64b94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620c48d2e6d2037214e18438f36f4e49078700de03aa08e1b52935165c18f57b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c82207c8129a6fba27168d59d4622308b50227 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1852d5f22fcc2facce41278c4180204c6c6c5d2af5dc466a13021eab14c750a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faf90429d12f1b1da518ceb83da182f8850c6c8f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a056c9cf14a3cdb8974b21f8b956792eca499221b5a16b64cef0dcbb9a261b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a10fb4fd4e3e882d99726d68439e8178412608b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b937408f97564a44551b1e7e1ae4e749ed5c68f51daf1a7eb36e411556d7a95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa2147ca94a5a55057ec2c5f6be0191d451c33bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a549669cb83f8174c6865150ef70b7fec2d6b640db26d736cf40b8b602bd47d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9de6fbb7d5f0f134654290760a2bb6cba9e2a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69660557964116b999debeec142d3f1222c0effcae24e59117e6da98b9022991 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f6bfbc3409bd2793c0b9fe5d36961ab8542cf4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb9609de09a8c4195d0a0ee0263a26f25e22a84669353b935f3be1075fa7656 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27a3d2773bf4fa448150e79ee87aeff76724c216 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7106aac51c68c4970df8aebc57f4e0d0c24ad861aa795922e521cd95a41107d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd7e0c716ae2bf54dc20a5b54e6500c82ef1ea5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e23ba7024a0d0bf5231292d868d49e3cbf52fb2a6810fcd6394f1fc0700067d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0835b88194d4fbf3b5a368c742ffa2935d7e3e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22993c6e51eb9d95399771c572ac3b6901d1968040c14bb255375cdf8507bbd7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30bad0816a1cc71044a5c274658b005ea6d6e707 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c61be0fbd74665d41dcaf643b06c4a91793e94acefdec3c48f24d863685fe7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb02926d18a3d693dcfd639548c780ecf6bbcb7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3eadb8eb6a5b2a210883e8911d9a68e86896028e9f4152787e07482ff764f7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab259bdaf8f069752093233ca3b99c637be62233 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2617c1179a47c06632cedc3031fa92926b100362e80716283cbc02128f84966 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43962a2ec0cc2169221db4b9b31842985603a0f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96451ac5f8b0ff471b2a6d963730ce2b7fe23501f9170a13677fa57344ca580 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a48627857f22eb7d0ca8b95673d233a9b1b7c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab6eb6c7fffa139cc2cf40ca11c75a3cb0ba5b80be1d68a30fd57705f996fcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d96a1af0e455eab71e2304c11f80300de271edf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0547c1760ad5f4ea6570dc579bafded0c67dc3181c936060d0ca5bb5eded7f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..042ebd93d47669845497e1a78f52bdcf11336420 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b505803296d9918c7bfd94e396757f5e6be59d2251704139a947b4c03d0bbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9f7cf65014416ebf05692729f6ec4ed1b4da60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67fc9a21b1a4e6d22b487e5778ac2048dde4f7a9c732533326de29c58f85c8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39c7d6372d7ececf9daf624dfafdab26a8f5c82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd05343ed9dca05c38a176c4c060030c293d064348f842b91160f3899c7a8cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1fdecae086e914342b30d1b78db5e22847fb49c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180b2feb7325ee968e091386c2691a848756674b3fe3684fdbc6e4fc8eb1ef29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3251f10b7d56684e3faccce3ff95a99a699ab2b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82327d92d38a94595401a562a64f6808cb25b18520465456b67ad329beff9a0b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66be06a101362c78ab4be9ab342aee21ce5486fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af2a318ed7fa08183274014426c07bdb2185e8144802b3f804acd4b10b9a8bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fbdfdbad1531c2d2e3cbad1d29c7263921c981e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a306faffbbc44c6264907e038da8187eb14767ab57cd57d104869124a8d6db40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df46579714bcb88d7fbc5e3d47c876d57f546fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e63fa78c407f9711fbdaf24beb70109414806f356a6015bc33122c6142c84f0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdc7f0b763689a87dc57697277d70a95ddbc500 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675e4560234d1f0444950c9acb7e2226ecd2c6f425609d34edb57ce3ccc72bc8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..faffa77eef78c135ff5359005e0c0b79e2e49e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b655759682824679fb91b2ff1f895efe85ecae496a27e7b85c48b9a56e2cc97f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d344bb9d64baf836d1392bc5c22af55d9b3becdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a551755030acd4a01c470fb360ac856e5c027a49c6f96815fd304e6f1fc1a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..380a7391a52e70d43e9ce8a41f63756ea5f4ce8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886a0238f0c8e8169b0a8245d957e75116906f9aba6901ce4bf98c90cec34db3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf1ff131feedd10165e19d6736773de64b297b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710e8b5049cb93517dcfcffa2057e27bd1e95a0376bb5689f922b13c0488a173 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6a120024e7d1e17e09e9f99596604ab107291e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f905f047dc07af4969a78f1a11e09ae2d1d4a289618dfd1aad087ab26cf1fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa5c5af09325ab50ea5e95a42eb1ef165f2b15f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:958c412b6aab4935acae1314b24cd941a4a7d8472ba4bd9b7ab44b25ca71ec90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3ffb7399bbc3b422e96086573adbc64a79ae97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3c35b9928630dff12a65f3915de3664e78412f6a472db11d4ff243ae4f757f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07893233d978bb19b8b1bc70bb23da36d15987f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f951e283cb9b63bb973ae16f6a00518c380362dc66df1e5f622d2d743f96deb9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30882bf4a5eb18112e2c4f3b4483c906bdfd21dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6766d5446c7a271ebfb04e923ea81f8c27ef6787743205e762c2e107e2fdfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1156c5788d2e916d6c9b9b0dcac940b26827b2ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7373e6f89a46aac3e9517fecee1e2a5d0f76918b4410361a4ec79c580c24393 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3a1bb064c774f32cc21fa954ed0b195593f7548 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc70c40bea0bcd3bb2212b5834d571ff059fabd738aaaae45d83530bb27a8444 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb1d9f0d5bad00d0f0984432f53f68834cf0a2d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e3de9b7f235438329910622d98e47e7ab45556e46aa44fd34cdc3263b70442 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e64cee1a50a7333ecf787230dca836b9372b3b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d653a5410eac2781fe3caa5611431b9fff28e7e6356b4f7d04127a6f2f75a06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f66c2629fe1e78a6c39a28ef947fa53bc22d092 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47da5cd0c84584a4cebda4d155198a80681f292e348743c333a005c28e10197 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..834528a53b5e519cd6595f4631afad545362cba8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd6ecf859498923fbebbd0161f0ef43c725362a78985c18575b03363d462dca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec5bad275ebf3ace52d0dcca271a43f0e5105b47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4cc66e533976987ced906e17c0576b950658e5739660673308f527d1b32904e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1441b3b51e69448354a337b01c9d3caf94d8760a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d626d39ff8cb4a4b1531097c61220dcee9ebdca6ce35d2acd9d092e1e9b5741f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abe76204484ef2ee722519a94d0cb939af64721f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edf0ab36dbee3d1661ee8f4ff94044e23a5a4d428099937b3421954f229919f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15e6dcad172e747e4b7259f70865997108a0a58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404a95fd3b3b0ef9b37fe3e8db0b7eb6d055c9e4686b39c44423bd243e3f9f97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8e7342a90379db5199b5519c92e161ae6194348 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176087eb9acb03252fb2bbf033d4642241773579a93187549c15f8f636bdcfe9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d399fca3f49936bd403e82d75e209c28ef56cb2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:676173ffb69fb59e345de208fe6392fca2d9ee763af6ad02b4b15973fc5675e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63cb63ff5516495e5f1fdfb2c16b39acb3cafb21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5302536a02113f610fc79e97857b49a9a950a59cf382d6a0f6d1677ed2a5528b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e65ca28ba0123287c0f332a26c02e4c7fe9c9be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ae4e4bb7a537ab21ca456d1943ed87f5a4fdc4f7d6ab5af70743d4652515a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9184200df68717ff2261d922edcda789a8bb13b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb99b1d4e5e7d40936ba2a3c5d6669782b8483904f321ffe7167e533bba1d90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde7b1804ef01eaddf0cc257c44103971a8ada47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce56fc39649e2beb100cda5518d0827a52e3f247afa49e4010dbe77d9b2ed259 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ac2c1b26a7600b5b53c629a09c6c4082501f10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab09fcbdd75f7fb4276d88a0ccb713ebfa297ac1208db0303404b9ba7a2d79b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b4b4544ffe633b198bab18c66d9072bd752e14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10773b6e3c9ba290dab84c1236efca330de38cea67c60a6896c0b4dfd02152c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..580a274dce5f70123913250191a9a4a19ea60422 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b16063e8e26781b54104d81de351184e490a815d0a9a4c6714717bdb0c5d4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10a0631e120f7086c6db63f40d8a7cfaefbcdd90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83ebd4f559f21c706c6d714916f55961b2c13a01c0b2c710380525925048eab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f7b46fca930658bba1f96f6db32be507ce10296 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b192ae503438608d3f328ae393d74c48db5b9515b7c71c7a4698276febe0b11e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a999eb47ef3df742775e836cb080fe347149ca2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0ba3e447674e478b46e5404c00ca15c310ef2f7750a7d7f818da4e9d39e6df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7bf943176d30873b655b45d8db23bd244e06d86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7d9cd59869eb807d6303a7fdd8375a8db4b215ed6606f9320e6eb59f7907ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd72e712443cde2b2720901389de6ae604b4bc9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4438c33bc216c13fb8980a545c18ce36efc9bed37319a13d2ad2b732d60c4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79fc2b2c2e30441ff5dc22ac0671315e66ff5aed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a43c1ee2e9f43f7a9b067a9d8be8ba9033bbd8199bc561d90976f2ef644a57 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2dbbfcffd71bcd3e5dbaa86f8216cd4d16fd88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa993ab38c9e09dce5b5a038a01970efdda46b0dd7e24116adc264e59403a075 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5f13fba92cfa22221b4b4471be1988052e5dce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248099f20a444f6a04586048af041068f5bfee3609573b3156ad9946598c9b3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc69b7af13c5d3833f2a9f3817d7102bd4ca4331 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2375d845eb8e22175c7765fae1db07bd9ba3bb06efe9a76b97cf64bcd498e926 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d3bda52298c1373caaaa8a17adab736da5fdf5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de99f1a686ad62ad6cd26a32ddc87be9519957349a1a41e863a7a9ae9f66e90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6df4d5451b866e676952be3dc13c17ad09e7e78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37692c632776b7975808ba06b443c5de9e3ff27c195f38cae1a09dc0e166a861 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a5709cbf2ae88308e284962a1f9554e1807f18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0431a5844e75c0e31566a65a42ff4bf3b1cfe23c5b9be8fc63b732b8648ff4b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d7e37657d161f1e4ee8d032a12374bad6b344ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44582674f08f9a4dc6c1e621f41059ab64bbe42cff27bd802b99576e2f6f5c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..013e4b77d465f493a5e87e62890ae58ad78041ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb01f2862bd346163edfabe4793522e77cd53bf0e86674bcc46c661ebe29ecd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..200a7ea8b68113d728512c63b4feee754cd347b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42cccd76f89a1e84ec8015f594be95709932e7a0879cbc115ea43d558ec6793 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13abad1a5ed58a398671fd05d3c3e4a3237edb92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25651a39ecabe7218e6d516f0d2dca3cfea292dc64bd56ba23a4dc6ca290b1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9ff2b0c280611d94cfc7b3645fb824ee4544d7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07ea138138cebe8b4c207c5483ac5d4388decf1e9e89a7c2c1add8fb721da37f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..353dcd14a4c189774b8e8daba6f7c7363b545989 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0536fb2f32f43e774f19dfd64d702a47853fb114d84c608ff8a68afc86b78ecd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c688e28ac65fbb542e62c03c10e512add77b54c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5285e4e2d3cc1f19b9ca6d7094652de9a23e856d612bc4b55fb044502699dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87ac0aa48ce78596ea32b498af4fb18bfba6bec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9017cb0bd8170ba1d6ee0668b27d8448e9c3f1dc8bdc230061fbfb9b2cbaee99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53db09010c9ee815aceda05744c5f08df17a03f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446faafe472af7ce242c8217d78f6a85c66b397e12948a192282093ea02a1eeb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2e6d96d45cb6d720842b60f13e7599360a859a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e6e61536939909f64ea66604e4a1095f0fd89eea7a950d89cba01ecaa08384 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b834dfdebd7c49616eb8b06bd92de83f64d56e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2739e3121b4d0699391157528000afea887adb7dfa2907c0a4ff9672f9c7d8b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc236066f71442cfbd6a25fd383b961e712925da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fc7b1faa43e2fbf259c5622879388e1bdf09e09af214b1498112e4375113d5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b526402b89ced4193bbbcd691f4d2111371e3e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49b5e3478618eab21b35d338771c17d70b7c9b001b1a55f46e028be3761e9ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c152c81b144c00adb635898c5dd72b3284c24afa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785addb126772cdf7fbe90777b26176af067437536da058f0b252d75d5c90379 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a2e33dcf203f7599a4badf0784fb1927c0427f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52cb53d60ea0314090cc07dff626d5aa5012efee8de270c0608e7bdcc3911a98 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c5ed3fc91a6efc58e24aff4b4e4f92d978284e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ccf1fad0f509d1795bf6404791e08f6168b51c83e7b1e11e4efd497ac38e105 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7c341986551be8b7fb5c116addcd708ee666a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d856ad69de0102e7bbd2368a5b71258f65d10cbd552fc9972f12bc09360cd608 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..653346a1c8b684fb18c9d17180860293a554587a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527bbdad97035474f2859f8136582c8c68da64f0fab432d8f4fc3572570f315f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c7f1cc07ed9a44b547dbaabb080c68e959f80f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb065a93252b4b839992b5e2ee7656bdb08d471fa679d177ba0aee59ee783ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc961a70d84bbe1d8f7495b4958c1cf9f07e3be2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149847d3f0c2f50ddb020822a44ec139f21a0bcac471706a29e2a0b1c1eb459e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc612e87590d9071c74ffbbcefad57b8ccdbf16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09a0d1766af9c3098f5a05fef9c7527b3484a03b778fbee29496748e6a03e5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ada68871f22e6fafb6d35445c0508f94a7e0bad5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da35dc4ffe21cdad8d027b20403e26d02515390769deb942d063adc5731a2389 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96050f5baba2ae4ac14dedfc7f234b5ca114d038 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9ed2786a613cb05d817fb52c40df785cc010fcbe0cec57a7da63115bdf3ff9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49070da8ee716e15b9922fd27dfe1c36e340b37e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95219e5f90096c37f26ca73e0a1665de30a4d3aeb7b8b40435261a6693e71b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9474b2318544a196e829f52ed08aa1bf45e4565a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f985ca36fb3e58689afe106e10e3601b0494baa4a165a61c859b5e3b70a5b6ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..320ce8abab6deda50c8679279fc356746af91c0e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f769b2be10c630c17fd489b79df89b5f156ace191cbdf379e70ed33254c91412 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1135adfac42d53fbb56fa040e3a9c01733bd948d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea28f3d47323d300d64599e912b9318230dc2984141e615e64f9ae5e21f4d87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85d30f49d490a78b141981400f38c0eda193cde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b33cde679c8cbf1eb7df12dda2ac370a038b06d91d9814553dc334c07ff6f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31c6426ed9d08abb5e5a2b3ec5d56c5eea9ece6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9991a483e11d236ccfd59fbded4f0ee6e0b9431aa7f97475f35dbcf92baa2b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f432518406ff40bf8c2ce923cb33a15aa20d2d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75f37357405a85cd5b5fe55b7d57aa0870e374013a66752e591b87fbf0f9d8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b024617009c342d05b81c2ab4dbf34be23159294 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170ae56593f87c74a067c87d00891696d6bee18820141594d445c7ed133794c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d775058dbf93f28cbb9864f3e14ee4b94c1b86eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53b54c489a629a335b7f9bc51cdeec3d7bfea7147d371f0f21631500d10f8040 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44bfcf8ab62af5a62cc90c33d4be934d1f98a82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6af4df17cd41a5b5bb8a5ec3c7d2d4763bedfb8d4c4db65a77f3286ad5050b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1165c84603b995be565b1b82c63749560b3a230b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:259d44c86e56a8acbde178936abc1d645b2f3e589a5c80fa9cc2ab2549b63765 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7f23625ebc5412f88a022ee293609371ae3df7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1138a7e79107c500badb9d08fa5b6b938bd4c6ab4c72e7f694232dec2fba60b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4853bc138ed037daa4c2c087fdd7b04ac0b11c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156d1a85e947303f534d6621e109f992c96347c583983381328467e3e71c7c36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a598b7cd06e88e4d5007f7ac11bcf1b2a24e390 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453097b4539baed1501de1241d363be3a5ca2cf802180067d7e2f5868d9f34e6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c2287bd8feec999ae4a0d6f2d93ba53fe4de4c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d16089a38b96663b16a04e7f6b3d09626c89a37b5028057053f4c724c1606b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e05fe24df62a2e0c45dc11364c8fd7d26749588d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666acad6a12b07b839ff1e0a6e90f6eeb3f3f65fbe343cf7d1f18c5762cbc2a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bd83ee7eae06d6dcec33204607bf8979ab1e359 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac25f0a37f6b4ce9f46a3c250062c6014f08eca797ac4ecd244d4ada28759fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef030832c874b928b0c1c0e36121e131ef1b733d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21b68de5edb8a282b592c429fbbba974bee8a5a7d700a6dc5dba881102bac8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18831b968768d7954daf21da28feeefaea57861 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1b05275338eb3906bb6ef69e3292c74bc7f0f6d9f40d9dcd2645438cee9fa8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27b654d84aabb1d5bd23f3a6a27e3bc98befebf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea55b0cffdd16027633452f9590bdbe8e7ab76fdac5ee0e0802013a565e0f87e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78f675b1b712380766953ded88a327ec82b198c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88be3944bff3a57b9f5b85a3defa834567b96b1471b2b410d0fa8328eeabd9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e900bc1d47c4941f243d81c55a70baed62d2f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f0443dc281b741521e14a157f4cc9f74eaac896284045636c35cd1e20c384b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..845f6dc222674d7982e83985531cb03622fdce42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff48426c11a9eb661397eb6facb9acbcc68b71fbe0eb4d755ffdfa3fb335114d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d52103531eb6b0542668b540e0f915617162e5fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6808af16427228690502dc909fbf06629db795161c7bd165f8094d8b8bd50b54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c49522f4762975df3d26b61d8f2a9618b2cb2307 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e9ae31938cbc77252e921ac86aaa6f5f485d90606e4473f619dea00e0c5243 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..289f0311e6a5d9ce745072a23faa4d3c5ff8b0e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a6cff336a88a4e41f49332cb296aeae5b4a0ea65c7d0fd5bb51ad8f18502f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e97617125db3e980329b1625cb51df60dd60871 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c8753a3f4d141517e6bf2a3e3f88f44bb844049d932183b2ae31954e1d6663 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2ed9672f54a175b1e1ec091a30bdc87063bf28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c2f93017596743e94d9b62c87c503c4a1aa666b1b4bcfcee215d4a9281c8ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c42ad9add6e93235ddc992d3d04941c9dbb7288 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce58af1e9fbcbe1ad9b721ba3889a835116ba6c320559032504fe0ec8fd056cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1564fdda45f72b11c9dfbcdb7faf8e9cb34d7de0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd4e4c7f207fa877172cc3617afe1a3b4e1426b2cb9e62f5a63956eeb3f824d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba297d84373e1b05fe01433bdad7bd9421e0043 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6aa46b5f1701dc0ae7c797ffb90b39c01f7bf9db701cb64aa4130b37c8a43b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a672cf5cab5b6e6dca8be081dbf91ffc0cce7efe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f17d06b383278f3b602098ebac7c90e57b5dc3cbeef4f4a3838b4e88a98753 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eef2a61b731b4c7eb08b0b2a683df8c35798f7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67eaada33df6006d9c8d5860e881852e8ce313954f0bf47555773d0f3119d3b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b17642739de5096dda52a8554fe143e0656717b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6e9f2f7fdccb753153d67e9ea60662b86b3772a09c1abdc186d9c9571093fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea91e880a8892e43018f5423e5731fa579249f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a4dfaaf22d584a5a4782c77f02a7158631679d86f1ac0b3de8958312c205b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbe018f05612b8b0cf3474663dc47b5fbf72184 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177b88e68ed4b080357e6e6afe81c520c031f4adfb775183bd6ea6380169ccc6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdef363d5e2f00a08d0500826930cf3411ce046c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5cd2f957e6f0ad0f3812440a8e0b19a5c783e4509aadd5b4034b73576ee218 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdb48ee4a3a6a6af848fe627aadf6ff53cfe63e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2ac6595c32a8e07742b3de3036ef39c93ce33636045397b5907d576748d55c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65d63dec821875804ca690a9d892cb065257ce4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166a3b5f8ac01ffbb86a46a6cf2f75e24a6748221c631a568e0625ad6ccb1962 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e8e5b5f07575f0aa4d70986654feb0580b3aef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc028aef6f2243474942eda645e56c4b6469c50dd567347ae8310be7d89274f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c1deb1f41e289e4b680136a7541bb7636f10b7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51312b0f2485d86dc1c041d399ae42f0771987e048229cf8913c641284c24f9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d76fbab491cef65eb261b642480d8f10b0870b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf3c66f8f972cd706317c210b9d186cab014e8443b650eec6c87c5792a8bd0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16ea54767ba41e48ca53d74e46098a3305f9a585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adab6bb5d42ecef917f3130208f16a28b50dda166d8f669f2ec3b250a83aa934 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cab784a57710f74a20b195f3c13eedf261a5bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6a2b706fe067039fa4307b584973f9bb47810ad3437275955acc4ea61b0fc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ef59ad2993ddc1dcf107aab2436dcb402450efe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424af9c6e1c9f0264be76638a8140fa5cffbb7652e2fde3a757f5f5c188fc997 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b008874227c3d497268b0736eb7465e8e89ee927 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033568a3541f3e7c326cefd6849eb618acd7285ca24dd46b38547686b2831c63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a72534bfa97542518f92d7997cbc35392014d364 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b3a0bcd4f6fd53c6a91ff90423fa047349824fc066e70703df57d0c97864e93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa9865781a85e9ddf2eda7445671fbdbc1d59b11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad43127bc57a80796c97eec3ce50830db686b45c10628dbcfa8ca29d4f17637d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36162afae7fe19039b91e9dd43180b509cac9b43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a62df477a9314a7e7c593aa5001351aaf23152abd630d5728abdf6ca586b69 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e287b0d096e9ceb2df09e33e6b11e47a6a91a920 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c68eaf8bfeb927b257574bc7abacddb70be0df5d3cba9b292c70010fc9cfa8dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..821c9d3aeba36ab3e938166922e7d604688570ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64c3b7953f1d9e0f20afcc4fae383faf36f8fd5fbc40f294c4e5805c09cc00a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ba1c5ee2fd2777d946b898738f134d8f32df1f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c1950532866611ad0d07ac1a5be4c09922a53958c32814f57da123e057b2bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..179f72e419ea3e719b886c8f58c950aa2ced6188 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d354d76a56c1e2c984f2a047fa2e3d4b91bb8f54682850d5cfbd2869d9118a62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21af6dd0a74f051f0d7b7464b9de219dadb3c752 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bbd37a2e3c32ff98df38321ead61e86abc35a21218f24b86d06035b5a60168 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f14d4e0ebeaf6905a39b7e79967d07de9b83d9ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac057e5f316f9a81a3ffb3d2867be68995599bde3ea490c5bc08182a31c01ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..680f598fa533c0e09ee4247e419d3c103173ce3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0ddeaaa6d1afc57280549ac90a1aaca0040eb328e7390cbf20d0654065439b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d239b8d10e34b394adcdd0d4560cec52c7bbc60c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4dd9096dd5de989b7f3a2b187746531f08e35cbfa5f7260a3031794f22a881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fbf5b25275b2119d17e2278e3e022586bda88c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6fa3da6a4abaf583b5f9d470ef07f695a579073affcffe9c4b25e78decca55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51f74fcf1e8e9da1883e91fded80aff3af3bbe4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b073b54e1b7853ee50893f498dc149cb97e8906913fb7a1ea5c536f00b7fd47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0ce2b2ef84d3a54ef34cfa16e4c62bd908f6ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec3c024cf55477e46a46327af6beac42acc95dba0b11440cf890cd61b72f442 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8326933742a3894dfd57e150b8014c87c69f3dd8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41f95ce3f717a9eaa69832701aeb45f87f65d198a8311ea82fef4fc578bf32f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52fb2bef15b90e7070bdd1b1d406b569b0246f73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09242562b7e9d89deb5e7acd938cbc90c7e7b93a302eb2462b3f96dfb9658bac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac36be00707179ddf4904718ba4f950d365f14b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa548ac964981531e30b21e5c2a44005c3e272e9dceebca3ed4c4453c811ea3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3cc1ea755faf68f1378ccbe7a3bd3069ad4ac3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771da0cf054b091104f8b82b9f03cf7da30955935b1f397ea50bfe6c03baef0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a744b1372cb656c496f1437a2b8d9178cd0fca9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3cfc1e64c53fcbcc3dae9742963f442dcf31790d862f2fe701c09e335a3c0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44523f30cd155702d34397e782aae78c109e6fdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5658378b847cc454def46c9e43b8e77282a2bd820795429e852ad6a3e09078e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0d61d1e07298301d262311776c2fb597d97e54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e87e6d09de5af85fe282ec634cb5b1aee9ab9c571a5b1b3376e2f57ef8cea1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c2facd01b85b5833e3a22f2a3568598157066ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977335c39f3f07492c0f4b9cb8ae2323bbc5288a5513320643acb99ecd844a11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a829288fecd52acc3d8944796e217845d8d474 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de801d3a21679c98a13b59704b3942248b2239c55a98aec1d9c037185d3b4b5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8009498000a1cc00a9614a9796e0390bdabd05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efffbee0197f92eba0e75defc9b04948887b6c9a8d2d48707cd51f6c4e2b6005 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dda36eb7afeb27bf4f5dbde86273078f5e377e16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:478d2f786a96849db7a72f97272ec36a67925ef05b3ffcf6d3c957dda74a3506 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8398bd3b576c5fd84eeef803af79ecf14a7863f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be5511239d30cc58e59d2456fc5fcfcfd1ab08f988c55c198a692ae9219eb07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d03dc7cb1885106ae461793ff3fcdb075ab219 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea3354aee4b4d47d984ac0bbf3d5c71186a9441a48300e69b0b21947ea68b1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69239793a71c7fcd136fb1fa49a02644d3ec7a93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac7110a4332d274ae16c85f17c4055dabb54f522ffdad44419d9debd026991c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3578e2c2b4800d380b302c0e7296a1a877529a4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56a73b16756f9db4362b1fb5e0f71d8e78b9fdd7f92c6900f8948fad44a9f56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d352b6a1c1d5452ee813001eb614d8ca626c0b69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244a8c65d5fabb2661d889a61dde7681699b148add71b7dc0741bd8c9ef70718 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f99d7ced1109f2402c10daa8bb8afd05adea63b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f617be431c549f03dfd99479a9915b1c44897e465654fb5a30f0320f53410ae2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fd81300146c2935dc49c02b48f39fdd7ada410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8ded9cc393293b92492a3b78d860c4edde35da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc9399edd7c35db3cc11f2938bb0509f097d7c1a47bf9948768ccb3145d8cf54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..213d378e4e2f90827d65cd21a77cdedb74ffc35e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16980bdaee2b11babab8cfbf40c130becfb7781405386d6e2eabfd0345049f3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3b3dfccf05d599717bffa78703b4829040b2bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37ef3350894ad0ff7ddf1d15b501c804281d4de12eb4278953d32d32e4dd3b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e34d831a57582b6fbc60277a198f8a730dedcb7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9e50adf55fa9bb18f324a6d0b52f023d82390ad34ffdad48c55778c38035af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c32353a28bdc8df157fefc118e27a401b19c952 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22e002264553bd855b5c058ee01a20df50326e7a2f9a6a80164cb30f1aed835 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed245832cf2e184f31ddc29f802315b84ef2b9c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5bb1081a4af55549198072b3cf532b9304b753395e106fbc8de8813a3c8553 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b276b0a2a4c87704117dcf81f1cca659b05d71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d344362392879d441779f5b9fe83fc5a87f97c829ec9fca480ada2fc62540893 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9379c441eccd32b1fc496cf88d8a477d88b9b74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167ba7cbf7d78c5554aa1e45e3d7bd5f2581ce16edbc3d856d99ae8f085447ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1612418d3d88abd2e6670a7252b08c11714181ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddc7a1010155df42f07b1cfc7801c0715e388da16bef7445ba17b76f282fe66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acca0bc0f00f49e777eb4446d899be7e38d12873 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc54c032a4b375582b5a4f8c1b52301de6be6394df268a33bd39a3803f2a9a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bee9fae426ebc6b3937dc2007b3002f989b7567 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c5ddb4ce569e2386bc734b66208dfefa3a05adfd8381899bdc065e9e3eda94 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b608513d5b8b4448affeac5803afe12c730645 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1db38083a22cef7f2210bb0597a657a526088e69acaa166d1ff4e8fe363de9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c6d957b36e302a30eae41586764431602f96e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68c21cddb9a9030ba0e6cfbdc03e4ebe1ff65aa18e0c15653ab423ae9cf48ba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7fc1d3dd679cd95b5f971575345404f687666cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6acb7b2c330853738d7a4eb2badb7a23a532af9e3982ce9a1e87f16c56b884ff +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35fb33620d9178c4ba31539e0c722ad39cf8ad3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aaded01a5429e63649b26b3345c7a92be50200bdb3360c8fe84c9e7418c866c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c8d07b774e524169bdc58c7462500860e22544 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d8f0039334f7835c3ac165aaa67f54915bc9fdca3d4c90c7ee917d2ce1b39a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92e8e0985c3179380d0c58f17050202e7507b1fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22fd388fdc29ba5d7c6bd8925a165fa4680dc2634c2eb8c569ebfc3ed3f70a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5467b07fac5995cf9f75fe5c628364314f1fda35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ee5802da058772dc4141ee4b29fa04d81386fa49a414c4c8eb5fa479cd19b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..090daf0e2cc122b95b2a84261a866ef6582a3016 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ed43c565dc73e036c1e0d71b283e55bc4f28253603f6b19b90f6d26eaa93b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abca3269f685bac110b7185e12021dfa71420903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b7a07187138c7eebac424506f4c08459388a6a776d9b827f55faaaaa3cfdb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dd69bad95d2a3905d6bba85046cd8d8172c1f8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aac7803fbd58680c132d111b62642b961361956dec22de80bcdb66d8b580142 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be70d7ac6786fc95efcfb53a56560c0fbf40fe4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0bf1dc8edc2ab33d8aef934de7fb02f9c9a1b6526b639eb3ce12d87a1e04fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b622f40185861f686357ebe10c82a7152a39d59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5e87485dd1e84e69d28e5f06beee2abbe34dc72f641b610b254624856058fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f32994f8bff29006aff3675f18e225c8c004dd23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ba9828b13ef26ae7b379245a4df141c3efcbd23ab306a684966b1f90e0a4ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de2c7fba76839569267a6735d8a3db24984a8ded --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66270e83c8d54702cd5bcfb2098b989feb5fdfea6abc33eb2a7e8faf939d98e4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4f33e68c02c0c78500e2333ff176572b337fba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884c927930799899f64b0d19a45414e180c7409c048b381a34f79ed512d3c2a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e161eb415ee52a7e49e88c92653d391482a13d11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef352ef3dc04af4532570195fdb32d1b9c9d22c9fd45a35ef16b075765c6b1c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08cb483b2ce6bb6f232367572cca30b29e72ace3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43a38808970692710d883ed2ab1b180afdd337252079ce61a71263d4a20323b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a05ea7dcab9c98382721b53e26db59dd40ff6a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89aed12ecf1297be0440fe757ec65c3caf8efd504b638a7d9881c30837396ae6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de5049e8d0d1cfb19849e835648d329054142d94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15a289553e5422be03ae8b529bca8cd570b7e19e0013ef0e1aad5a3633ce00b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40786fe52f2b6f0fae9efc81b8ebb0c69e6e30d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741f62050d7b981575232545dc3a37914e22c87e61ee302269e5ecfbe792d58c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab6e945513b73b394df76dd317ce2dcdf732c8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc894acb2c008055319d284dc585e5e05d1ade679233fc85d108c42eb2087f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b1e66f849aaa2d22a995f24765f308b1b7772c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977f686229ad42e64aa76dada78ce2930a33ce9cb5e8b79892b0a7915daee779 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3bb1dbeff90fb6a32b26a7f6b6cc29084878f6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e508ad0aeab43b48f22029087b8156f088148f91d8c4cff447a18fe4dba3bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64055840a4ea92b6e86c22d64572b904b904fca8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35196c94476d75a92a82f5941e265e7e3b5bf0d688acb19d2cd27ce4b9e1ef15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70b96f4bf8bd8f6802b4761a9e0f917d83464d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c961da5f78bbf0b3450192ecc4d038b5c545fdb80e697580fb3c7990a4a3bf12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02eefe64fdb02c04b322578b608b0d5e93bbc59e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b83082fb1c06cc85aff78fd48e8e7f4f0b611c5bb75e88b408b2ec6bc8d41b74 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf5be46e55db5c1b7ecdbbe7d72031ca44fc6d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:678ff7c16e7cd1f9ff18acb0e8e67e8568a586eb64d8f1266fd1695df6f4f764 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b52938c6e05b77762470426ae81421f0be7d655 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a669db38cdeb0537ae2690bd49964dc9abc909e40af0494452c4b17ea53dcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afd1a8e6a1a30f4eebd816605ec60979c4b19c16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2082aee8adcce3cfae718d6ec66b37bc9bcf9423fbab0865ca4251b22a34d9f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db683b7e31f0c0fccbbb436ee2cf14424621940 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d3090e0d2ad049523b37ad3864260982bf2dd923bcb9c67d60ae2be914feb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffbe4f23a59b4ad0c64448005bd37a7a4c3cfaf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebddc1667644b3c6a4f1ef279969f47f34bb0f1c5fe8643c5ad98d14a2533c40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7f9fbbb3805355d22bb819135328f82923412e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e253c43a4c720421345a62a9ee464316d7b313deffc7e700dbf16e0cf3a9e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb7b12d823e381aa60893b5843078e21599e7ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b24247be020aef3df3bd82536947ac55acd22964e00e62e6a4220ca1a45e2b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69330dbc1ff6c0841b6319720ac2a5a6a0f41ed6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e9afbfef35751dbb36b5605228942b1843ecf5776fe0df4cc0e8ee11e4242a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d58bd8b641527a16ecabefef72ede10b1e38b0c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4691128df7958c1cb218fbd95be3f2aed440d1fbe23c06d3219eb64e4756ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..baf638e46d6ab2cf9662f791b9456a6d9e21b724 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d74f592dbaf2a78b7134b196f03516c7aad8bae49e1680763c4dab45fdfc55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5443be4140e18cce7803491f6cac8aaa6df6e49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab43aec1283ea240d35d60f2bb566f88977b363797efe9f209b4b6c3206dcd71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3309e42de5b764afc761124500509a60a568f3d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1bb88ff4fc6e052bf5a17743f189cc7fe267c331402c2e2fd0164189e801aa6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8c6132a16b1aba2ea85b7b12a8ab79c5a8ac86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e2293419c7fb38b51e1aa6a4b28479350673d671a887b46b2a25be8a5fa5ee +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3445990e05bad231e2b0b293f097d485d14ffc08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f3c7e72a4f130851dd32347036d4b53be235c5df6dfb4fb50bde8b846657aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4966ecdc55cdd676eaed11c76b047694644e76e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8152f0ae5bac31ddb2b377fa89e3a90f04ac50e9eec71ed435bd0d9a050b709 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd86eea4a7229c18cff9820d9242140199d7c84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4076ccb551740680adcaca9bd6e42d38cf0cedbd416bde7a3e83818e41f545 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c13c79b14beb5f9caabc311df8a4a82d3b90532 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c34f1d2f61f97ab810ed1ca31f6baa347c53a9eeef3300755d3b92d19523d3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac9d91001f8e7d743833b8006221de1d205f9a6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7e4394d3522539e2426b932367e304ebe46992b42c9373b35512d2fdc75362 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..913c7aab7bb82478dc7b8334657c420e9ca1faea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c10180b334f3933b2a8d11e585f735c8705192a4b04bb79bef9370092989ec7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe2d930f34268954d2e1b00b541701493f93eeb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8bb7ed65e6d9560d4ffe276686e80f328e4a53f2586ad3034c7a021b51af8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea4030b78eee48f3265bfd4a2cd5a21950cc2ddc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d63816cadaec2e066ce35231a1b2baa58e778ac6c072c980360a33e9c45e2cd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..045d54b39767a90c0be5e7dd9cf0d60d38d4fd5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f9bf4996f86066399fda95b32f0ad3a2e7bfc8d685ac9a15cb0ac98e12dc48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e11d42462a40774364dde0b9c4afeac9622fdfa5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacf8f7ea897a49106190830a893a728e3addb14fdea913f712f13c47d141282 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9db8f6f63222684bf4ce7c9e1edd60791fcb54c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3880fe73d3f4a49c6027f23f924ed5618d72d35801491b8beff0cc3e1afffa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..182b87670d8abb42328afce1549c2703f418a7f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad602f82175a7a90b0d809a914dbf04f532e8f10582c3d48a203773cb479334a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..569da7d75b74f5a5f18f1802b000997bca1149a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21fc8500b0afbb73d6e94bcc9d7a31d67d31af87324c3ab4e9a72ba3455d3861 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9d5bcf3b772d0e88ca786917918f1385ea45110 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce16b19cfb59a6ae081158429bcd5007a25077de8f1d91f0fb129e78d6ef080 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4fea742ef05afd88a35172c480366ef09d01c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66044dff3cd64733b1a09c0da645a85625ff0d4a37c96d39878bbff58a6aafc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c736d76dc29d369bc5fdeddf303f307bb2e3b3c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd51fc2296671fb021d42fc6ec65f70e2751d1f1452103d16f94e44fa052e35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c83badfb0ff731a266dfe4840e07609b569d03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4708cfdf5964ab219dbe7fdd2f30de8c0478ded58b8a2934ecb72f828cfeec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ca17ac30206dae0058377601a63fd324d41d6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfffc9291160a2a5f8ef2e2c86d38b72c929da36a1fba8e934ab8b429c08eee7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18d3c1e9c954ca4088fb804dcdce7e0201d5dcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710fce6a803f1aa7f46f362e1031541201db6014ede137f24571c2cffd4bdac4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8be5d50e3f94d85dbfef538928a1cea7b5729e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac09466e5bdbfaaab857649576c6f9989868486bc5cfd8a924ec80e646feeaa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ddba9f11f3f57daf9e8f661509de99b1b6a654 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8234c1eaed601fb41ad62336923085830600aee117e030a7f1a2b01fa9838a37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c63800fc6f2b95a92575c3eb864dbac8f6296de1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea53fff4eef96bb9f8a1827e287b1e221fd8e3dbb11bf0bdaf106161901a601 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46094d732cab44188d29b4ed6da782d5351c5491 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c366f05b73f3548d9cd64481310ac9b6ad74d6c49ef92f9d14587e0581e98cc1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2c9d34cb8fecadfe03954e2bcf6b8dc7075b0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9f8ddc638b051dc33c8d9de2c2659f47d2edf9f80c77e2645ff0373ea92d44 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7941ba39eff673ae4c39325636185dfa57725d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d190b4463ef1ac7502b7b720a2702d79e491c182b9bbb45bb3b88464f1b318d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2cd5fe290e3b8ad51b611fd5041b97d4504893 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d3328ba1292e35ff963dcd0f254c5c3c6a13554bc716732684ed4713c0d677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0fdc7b3335f3e836df1edd5a12c4e4751f31ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a44519050a57694e560a4587f17fced5a08dfe570d91bdb48f8852e51bc3d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dcc11c4a2773912284e90221c86321978aa2297 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2114fdbc7b9525e08534ce09afcfd3cda3284aaa92f63781a1a62949098016 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..946c3c028cfc2bc00313f8c1c7489139224ee8a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dfb37344bfe6a2c179d22b9fa7a266be26e82aa6fd9ab9ddd91b9ea2fce40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d229a10bf025b63602ecc5fdf09a57226c1976ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796f10c43f3205242b56b68c8d6afdd473e9abfd14f33b0db7873104c48a85cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..573d6149ab60b1992d5eaea1dae23e6cbb804106 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690de9291fc91b9f6e91c5b288be5c7256d94782b294740c42d70e83f200fea4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3217421da875e56e1d7c97823c5f2e0d788a5970 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b1c4ed510fa2be98976a5809dbb408f3c8fbf010cf3fe1cc8518084f9aed41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afd8bb1c3840c25e8f1710359fdb2d9248336159 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5958047c9e99e203fe0d250f571017d8dc72949c7d1735c0a63de848faeff393 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbc748a7bbcedba6ebf07705114e2efe8ee3514 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f0cc03b9c17b602343122bc1064e6d3e5cb0308719c62af8f77440d469a1c77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edcb41ce5259903892ccc4c397095585f31db94d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb8de3bb4a9362d19407ccc3f98848b48ebdfeb89b02a7d066a859c7209bdc1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77b5136dc7fb9f4f2b0cd58b355a2f4e9a17b0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b8121fc47057242e1e8ff6f5cfbf2bdb67f75dd25c2a1d0498280244a85ad9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..610dcf47a7d2c605b98360a9e5b00272656d9422 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3469c54152da642052dd87cf91b46451e81d9a3ea4d8ebfa931fb643b657f598 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a59be97108ce0b22c8da452dd59d3d27c3d2cfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9d7d329f71d1a017190cf5625d3cc9d0303a522b6f900fcc94fa10fc9bb7ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a377ea8beff1f417d669d56c3beb4634707e6e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a0271e591b8685e2cbd4f87fc107f62c4079211a563f292e8c331c8e7b6cb4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa3300517a171f648753e7e4977ebe83c0071f40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55d9f971d7ea705978c56ab85d393bd4d93a68371ee01f992ff0f92c892c078 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1664418d42924264ae16d626fabcdb8bce784b5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf30934915216fd522249bb1e29d62a608ab68ce48e8e60a9f0406d5ae65b8bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9b833b817bbbbeb705f5483ca09ceba29103686 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c07c04a70eec4556c0ca2a6e85b1752c3e274690dc84a976eabbd2b2b60cd964 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..010bc0f08c80dd714209f06198279124c89fc83e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24636e9eabe88e5cacd60ac28ed2d9e70b6ca22bdd76f53f6522fa1c83dfbff4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da464906ea42e39971f507ff2db67f319f1a622f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40726ed3addacf67aa4daf55d3a2f6998a4e7faaeb5dfbbd2aade69a3c1d541 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a237081987c9e544be1501ab1d525ed1d80e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e443de45e7a60384f66eb5686cdbca3f2092271a4f1464068afc534fca0d49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edab31e6ad8ad05ecb5d0bb6f554bbca937fa83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fcce89c2aedf369fc5d13b013577e4ca224ee591d4fb8fc3f6e5782d6771b5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4fba847ec50e57cd1f73ea1070ebb02987cc6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a20775fef75ce53cf36dca80b7c0bb4dcfe41ff1b4042c16a33ae58dcb9ef59 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..492957e34fba8d3140b20d60427a0f88653efffe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b75970a64979960dfc58ed20f99d2694fe3865902bf0a818a8a738f6698edbb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c465726cf43c20ccfd76b33d5c71b71f70ac39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa69acf441a33598be452d537d11e0b266d99004b2ece904654f0d12f83d1ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaa916d565abe9b9c4eda78ae7c7b734279e0ae3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456d990c65e8aab8bb12b1e65ed99084576037992317d9ff22c2d3b893ebcd3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe150ba6b6ad3321926ce714f6208a60b9415bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a55056f50e82628b7c4bf35a7fcf9251219cd9ae0dc773ece337fb6f6dcf04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d427c4c13713aea67b52ecff85f452d3ad3b1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4f9620130b526acc60d02aae15171190800546920e0815e51ef62d8a40a85d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd1cba611cb8e181ddd8e63c465b8c419d3ce33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376ab501b0afa8c49f425cd015834f55dd2bcf8b0755cf3de0a4fe7e1b46a69f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b88b3090285a4549e04b0e9c48b53669895b0b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d24d774a0c27aea0571aca5815223a6d666cada7d95a646b35b8037422fdb4c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d4fdbc2af2202beafb824f6e58b799152cd2e67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6925fb3b10786d958935a3554e93725284dcb8746613359cc172ea8ff16401e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d071855b2d5465a452fb11232e59b838741f35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434c6e1366916c97c0a17bea13b3980e293d8da6cd3c0fd6c2353633b6b94f58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..506e66181976824adf633baa1f260d3ef651fc65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753000f34cd8f467d90bb3229cf934f8bfaeb5e3fdc9b2f17630468fba47e1db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8492b348217c60c79c24de1d323b65744da87e43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff10b77a54fab8acd39b3d62a253cef5de9a7dbf320584037d837e84e48398f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e971ecfb9ea067e213432662a9cfebc0dd38353f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23eda7df9c1e1dae5645525fcd128c5bd5b05cde6e4478f17f5877cf89f6633a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc698b7780bdd729a2d096ffcf91a34cb597bbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8343b0a638d502d9751cc8edb9e1455e14a6f40c8f0894f1d27ab1c7a87f1087 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef5deb214a57c584b72b593e08a1389bd99774b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb9ae2278907998979ab4b4a0fa39fe583a33bedaba0a07a61d64cd1bdde198 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5dedf7baf3c3b8a65fdee21be61ac12f184e4b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0dc324250b06a16e161f44e3a9244ee4f9595bad1c6621bfdfd150cdb07773 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d474b4aec206c164c15fa3a2d9d1585282fb8c78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add5ff8540ae4b1f14febd11872b99c04f3846523b90423e36307302613ab709 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..262939239ab237527e87c4145c9fd77d6c2ac4fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf98107bbd02387ac41ef2427e154b4566f02b060c3fa7c97d8fefb868ee9c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89564d5730febe9df68131e4f357e897e36ea482 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82da4421a42f98aa975b78317a6e01d6af6ad7de7a6c0bb99da58d3f7cf3ad48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..586ff097b839ba3cbb5ae91fdc0064b6fc4ab58f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f063e88fffa8776029766b96f66d7395a586ae7102101caa427e28285660bdf5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95a8b775c21e418deb17b61188e12b5fcf1cccb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7147888e7c9632a10f9505cdede8344209884b479e9b2ccaa5688423c915a223 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f70a14e8bebc0038c8f4f3de9a3bb2fb8a2a88fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25164f20dc0f63bb6859a0d67a0d36350ad2d047961a1e2e496535cae5a673f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..341f57523c26c6e42837f000fd3419f828a729ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621c6264ed7fd78a688f6acc2bb64da037f8083c8368f701771cf936a017ed6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d604e5cec42f2cab9ecf447160e429afeffb241a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e069827866211a8dadc943cc1190dfeb7fd7c940c1a65f0a17c1305efd6182a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7edc7e9367a28af06de9b520a2ef979bcd358e5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1183a32c6f1661e4b6d249f4d8e5f7a22b24bd8f200b8223a94445a5259ec8cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fdfc03bf793b7e97a77c3bd9e9810b91b94de8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59469e1ce4aafa19560860dc1478fa43a51c7d0e6a3cb4258c563e6cc5aa80f7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8059806138d22d597621105d38b82ddc0101c40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b810ee90dd0517b6711317c13425653cd388f460fd2af2a8c8d6d4f0f9423b51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf0a5767f070403c051602476bb430068aed314 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df8e7ff1421bb09df37e8891fabd66e090c44822e4d5dc8ffab2ecd549cf6111 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7844fe7309fcd554abc6c2eef5869e90aa565a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede585f2c2e42a780f22f3de399aea254639dfb8aa08697e18771436dd622372 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e526a28111d60771e53b898be283582f2130bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aeef1b89c90882cc770c94afba8b4ff6bf62e63dd6e4297f4b722a49b12df20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1816244ca7b974e29bd5fb8a576b1eb227d870fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c11f4d40dc9ad4c101d50cdf738868b4f98978ea36b092758819e02cb6dc7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..577748395aa195bcd74c29df52b4e4f05b1a87fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21431f7aa2a9b714b520780060c65c0987c01d978efa20bf91215d8b2a42ca54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6cf5d6ba4b27b860f606399f019c1d07572e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ffd6303ff15d7f337b034fc74a576933629b65525e7b5c0a32f483071603c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec12b67d858113590747673cf7427430c4e718b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882296edc3bc963fe35d3e302c34225b52ff10ee32168c7c9121fb23a43da369 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a350c9bf1b80c6e112c92799c340067c151843a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5627c47f77f82f1d1696c0be4d3b794a9b101d4ecebfe4572293acaa1d7fa371 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a13959bc25cf7000728a170ec8210eb5ad9ae29d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b6d7b585ec7c9e38b1855751df6680484dc074b2e93dfac01742e1420be6ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f406da48bf774473b6b202f13560c91c474dc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5fc540ee6e27e37ff7e83a976e1660c5dad8a6d53ac81c34f9f6570d14cfd3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..150e66410a24d1c1cafd778e2a9b0252596b4340 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd928940147611fc02ea43c25d09b85db72ec9025d1d72c0e8e057b4c8708cf5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2fd02f7f41399f3aab3cb2501c14fa297cbbac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb54fa70d535e828be4e4e709a7478962267937b9e88a70375988777ade8979 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..188685eef52afd13cfd8b41fa0eb5a2a81fddc26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11ac1731806ffa44c3d9bd43113dfb1e5794b5ef5dbe17f2dbe236c5fff3bc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78caa0e45bb86495960ae3006bf101cb99a1140e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d0262f83ea621d7f9b85572e0d3132ee92497ebcb1e50d5428e29cdca0d790 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8bf95790ed678ba0f947971685f10fca1bddf0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7ab14b46b4990a136877c7fe2f609f0e30f6b8e87ef84c9c807a33d9e85359 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e3690752878ffea233bcce080aebc0cb291330 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced728e9a5944fc4e7d26a9fc3579e137b99d997fc62ac69d52ab37e1dc0fdc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33177aac1e659dce6873cfd8c1a1065cb71c257f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ddcc948698bcb63f4cfe34d19727b28591d542e518e0ca356726ee465bd85d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa183d4fa312aaddd6f613c5f9152bbee76e2a88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2a2dbcaa6caa2d2a0b1cb0093954a4dd98147a06ac29ec6bbc43cbf9d0634f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f51dd1df5069b07ed9bbc9e7748d7c721d3d196 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff11f2176fc5e734bcc6278cb5a088545ec5eae2077203c77e939365421c9c56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00295a0142701e9ecf7607c44eed52ab6e6b5f6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2878084d6323a36f82c0c3b216ac0110e9bb3ccdcdaf337dff88851cc71e6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a8da4949efd40155c88a4c48b717990689c5e3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14219bb7f618ac74389c37f0243d1fe78c8441b25f687dc530918bf6e73a8958 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89c9e2ca3a466ce48d7109e8dbe873e7ca807fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ca80bdec5cdcad78582414c923a9dcf295a67ae72ec95acd5761defe5818bc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b630b45c3e4e5a976111170da7a589c2cb32ddf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8cb15e17782539d6033a9b57fdd1fe803a497bdfd61437a903c42fea8ee5246 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b478edf3fdd792053095e13d2b9c8936054a149d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32cb1c2646625a542e6b846fc2107689e3157f21a145be632fb8fe9cd2d947c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8910661607d1cf6406da8c4cdaf4ce180735ff10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bef5185208dc8e025472ede18e61a8eac7f0759161d45e397ef8773f2067db6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec2a67e737fe731f71f30dc9cf885e900741f56 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e60983efa2eb34b4b1cb3dc9b1959c5b0f2dab6365f2a591de630dc3a500510 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..013c48cbd096120edc1ba3654891630d2222cc04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee59d9df108bc2b964b2afa045d3e68c714f5d36244afb11de959e9d3b2c40cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdd63f5034eb7783a8573a9557b353a92b4284dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55dacdfdc08216bd9fbb6c709342d2e9d42939dfc54669a7cbd2bdc464002e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..404fdc32200538ca91d3197fddb5e0559b0a794f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8d2640d64040aae36012753e04dcbef770cd80e55a38f6c99de2a2046521ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4781a84faba2bd19ecc0d6cd748f6a604b319823 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f060e932ca4a0349c3611c66349095eccb24b2752de5988b3fa6481fea49752e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..873785fc01c8e08291d7efa6e5dfc0948fb35e82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84e169cb179138f27301125a74eecfb297cdbab7da1edc957cd5bd4fcbd9751 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..210e8293a8fd05c987832efc621fc7d37f47d121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc510df9f1f40d0ca2a334f438c54a5a91d9dd380fb3c12c5439e38c0c920f29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c916852bbd26348ef9876317d7d90ddfe6d8a793 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b140cb7e788a2678f81efe11185e8443a589ca3b9a20c08e5e78682fe7bf79f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a5556ec08b2254735673af3fa86e2e40d7341f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0238583414a3b122c488f33d4172ea7c195fb3ce05ed853c950c9f85fbc09d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2cf2824be6f49530a2c328b99d8a92ed0e805fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7532f56b674a33775e2376ccca12c3931b7da409a2c5741f9f953013e0d1fc9a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8be377c35b79c67a4b57042b53ec2774989e1cdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03094f33297c09b1e1105731191b26a62b52034d6fe181ea55119dedd089153b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de15dfe8c38defda6d8a824de61d0d753b74f75c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321b65148b4cdef744e7be3e54adc33776a641986e326b7c90e7319aa467198f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecdb7e3d7b49d89d0eb6f13aa4838934c0e06eb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e58305192d10c61f24e269c0a3a9c88e39c74aca56864846600778006261b70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3298ada3f70834d92548fd51a5da7f3ced8b2054 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc79cc9bcd2db098ce5ef5c339b21fb8ad389213be77f085b3272a226e96baa9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c986de31b6ce22730f194e02d50c48363ec5b2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7fb827d8b555dfc2e55d7e3f0b1b6ae43321df19ca07b463cbc072bc01f93e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af5a5ae0f6677850b2b7f0418f6498ba94a9de7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abdd28ede756594246e595b34ec675d7e206e0668664b83c2bae7583b01e9ff8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9c7a71fb575ee6f3993e62bae1ec46e512c6045 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c95a20bd9313c9ba9afd740a1ccb14d9995fe8865076ce9206717f85165380d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fc67307e5a7b761c7ec29649a9f7c1bc577ee5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b30b011ddddea3a3cf3fd646d6d982f60ca3e89fd6e2f831f06773737dfa4770 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d150e8649052c3bb5b689273615d4da231f3d6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf80431d914d05c83558ffefacc886d5c06ac68764bdbdaf852c597fc82e539b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c4a8ae131f9203cdae8870431fed625a174386 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30969bbcd3f7b840d927995b4429361f98a1f1afb438e2eee26b07862a8f08e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9038b6872801eae17aee673b6e2cfe1f0020c205 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea044c4dfaf50f36f1d82666fe1c81028ebc683eca0b738ffe4ac83a90ff01c5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..770fe63a2e9a8d8698da66c3c23ac148bbbd4a14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90ec3786a8bf31ba79cad8b23abd2e8b35ad39db54dd472ba5fad7b2dc04fb38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71dfed15078f3a25de350d2e9127f5b894f7348a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba41d5ca7142d7c8add5d4561a7641c93aaa7561bdae2d834dd2346c34b4ae59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b71c77615dfcb3303da323fbeda7d29009c1ac9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf3e329317ed500bcc25be387d639ad3a55b4f7412eec47d9bedee5840ae443 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef2a2e64234ba49896dfb5c51a9709a7189506b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2543db8f2563cc4411da297ec5bc69dcc4cd47c866608df8c95e27a301764c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5260d92c712250e0a846fe23c4d03811f97424fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75e0ee8efcb029ba010ba5f1365af70672b2b45e9ee4f00fe19fcac678a7975 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..205904ad99ca158e9ef6b53e208951876173af2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33d5b8560a38ccf40e18863bd92321e06300f5bba30340ebd19f36e6ca07147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aea7f6276bc1ce3b675948cb846f420461b30f0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f464d1d48bbf885dcf85c9a6f03536868e63845a946f34e90d18f9482012ef74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..377df0056cbb01b3425ff547709453597bde3f4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c01e22ee03e6f8349563fc09ab5d779cf9b650a73d5b3cd8f9e91f14bc736a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0772ffc588bfc4cdf087ac7fff7f3a24c0c76396 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97eae09da8a65d92756bdb2657f8418f3353eccc58c4639a05142748133405db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37f4cf072fd77f528556b61f03b0dbed4ea41418 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e517a60aa8a4ff32f482a1bade7a334dde5651193236bb5dc2ddfd2d372ddf6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d2d8ca41af958c8c5f6c37c83f0a031ccc088d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c59a57f09bdb4c089f0cc4e6e69974707b09fe8d3c7c39f39b45c755434650f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd876d3a44e6ed48f6bcc3351d12b6e9183df28a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b359bc1f46c32a67a4f593df7bf5708f2647105c76b8533ba354e375547869 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccec1a588a0f36e8a06c159755c29dcb63294564 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3351d8a77789faeaf3cb5d66f4635ed080a83e99dbbd68a95de9dc246c90a126 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55adf86ebd5a0f79a8bc69f731af130a464d316 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ffe5802c7c886d526d3bae70fdf5543bd1b4e8caeca92996dad5723413bc8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df3235364bbe6d028cd61a510b00db236e38476 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c2447244f014c335550946cdd2d6adf246f2b116274942119574ac5acde759 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4c69d21969c60537ab66aad7ef6de339c6a1ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b60cdc69e71d8668db5747699ff3fa175e980e86142784ef4de115a0390f18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbdccc7d83a2dd3c6511219f8d0efea9ee169922 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a3c4aee57094fd4cdc87c26d4f3c52800fd36da62f691459240d43004ac2fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a50809255bc625bc3017baefcc621a8c6fcee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a92e362a60516494ae9e66ae8aa5a630e2fc1f39753d19b4cfc66863cc979de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fbdbdbfaf427c30da9045836a60b7b8a779a442 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d322a8426c8ae69e4f90cd44749971fd34372d533bd2ab2e817d2b7413a0a57 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c82207c8129a6fba27168d59d4622308b50227 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1852d5f22fcc2facce41278c4180204c6c6c5d2af5dc466a13021eab14c750a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1981b5ac674b27745cad0683cf9f799379952e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6230dd7d6a8a508912621ee3c0698aa90460ea1276116b39223d71e957226ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a10fb4fd4e3e882d99726d68439e8178412608b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b937408f97564a44551b1e7e1ae4e749ed5c68f51daf1a7eb36e411556d7a95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8daaf0760e251531fbf4db3c019619f9962ee14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe9ec8289a4179a9076c973b30564dabfb1e5a38fdab5f681f6703199c9ac7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1f1243cd18329e71158f53b092b7078e91c4e80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4955ca366ad79bbd7b60b837c4c8cf76bacffc58eb8ed1aa67874f58876648b2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d1e60ac5544ef54a99a2dc8646148757be92f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1ee8447c31b3bdfeaebfeab97c6c7d799b4c3d669ef92a3f2c41152716c8c4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9de6fbb7d5f0f134654290760a2bb6cba9e2a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69660557964116b999debeec142d3f1222c0effcae24e59117e6da98b9022991 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72507ccd8175d08c21356cd8df28fc7896ee0bfb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8dea9059db29cfc82b028716e392d848b0511816d8032955c2b7c494d6926b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27a3d2773bf4fa448150e79ee87aeff76724c216 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7106aac51c68c4970df8aebc57f4e0d0c24ad861aa795922e521cd95a41107d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e983c3cd2c8a021555f2e23b849d052fca2004dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ff2784481365cb4aa874a5ffe30a27430de397a61b4538fc8205e17c80a553 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0835b88194d4fbf3b5a368c742ffa2935d7e3e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22993c6e51eb9d95399771c572ac3b6901d1968040c14bb255375cdf8507bbd7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbe9cfad8f62368d1c292980d1516da0427f38d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd942ce8e8a51f5248968438983e5e7bb12704907181ebc7220206bbc534870c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb02926d18a3d693dcfd639548c780ecf6bbcb7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3eadb8eb6a5b2a210883e8911d9a68e86896028e9f4152787e07482ff764f7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c7bdd169e0c838ff2f60eb4608703da8a27c0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84890a1496d09f237a80d68d51d59c43753fa721095f07d2bfe9948f6ed4efb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43962a2ec0cc2169221db4b9b31842985603a0f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96451ac5f8b0ff471b2a6d963730ce2b7fe23501f9170a13677fa57344ca580 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb689dbcafd328189d57df234b8d81402743c083 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9aa67aee18fbc8500de43584fcadb4ca8e69c658687afd669a754b7b452595 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c006916cc946218d0ee5559f1865595d7076180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916f0610ec9e810b280e59ac16f090eceda0234af39fde91a0ee174409368e91 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c6eaebf721df581f2ba1fe8a76ccb7da319d25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4513f63897a60f2711897b39e076ca308b00514d89d6c5293eb9db1256ae0d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d96a1af0e455eab71e2304c11f80300de271edf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0547c1760ad5f4ea6570dc579bafded0c67dc3181c936060d0ca5bb5eded7f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..089539e8509243637200d7189e7e3a26664d82ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dddb273b0da7b92427d18b8d4e0a5df12c4b90384f2f9bddb4a8500268e122ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9f7cf65014416ebf05692729f6ec4ed1b4da60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67fc9a21b1a4e6d22b487e5778ac2048dde4f7a9c732533326de29c58f85c8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1a13aff78619c0ef3bb8bbb29257bb102ab349a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2caeb42971951a09ef6f22a3f67f86f6bcf3652ba4d3cad2d8849049cb4c3da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1fdecae086e914342b30d1b78db5e22847fb49c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180b2feb7325ee968e091386c2691a848756674b3fe3684fdbc6e4fc8eb1ef29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bfcd1508d53dd0b91aca3dbfb786a471b70c173 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90892761acf104675a93c22790f3db112531ed78e74b493bf97619ec27113544 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66be06a101362c78ab4be9ab342aee21ce5486fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af2a318ed7fa08183274014426c07bdb2185e8144802b3f804acd4b10b9a8bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bddd211e8a1266b9b65d021439944d289db77824 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a371db3a3325dbec3121963834efdce5c5ea032b9dd16e382471b47c3e1ec80a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df46579714bcb88d7fbc5e3d47c876d57f546fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e63fa78c407f9711fbdaf24beb70109414806f356a6015bc33122c6142c84f0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..148571677aacf20e54d21d900f4c5a1726008edc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24fa54ff9fe0790b3710be3e036726382fcc38d11a4cca7bc3cf02b239e1ffe7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17a788060fd22966cb1b5b952af7f9d11faff63c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37601e1bf983f16376c6a4fe6c9e766d6f78d0198c0ee6c92f7eed71a7ecc23a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db6bd933c74b96f726e04848b3abccf31bd86807 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c12b48369dad873986c955e8a518b173c22a13d1a7f27965b244244686489bbd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..faffa77eef78c135ff5359005e0c0b79e2e49e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b655759682824679fb91b2ff1f895efe85ecae496a27e7b85c48b9a56e2cc97f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df34d38e85f9b2ff22c5b81581358ec54faf9908 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0ba6f670094534868159526ccdb819a90c6ed5d30bd047209127fda13924d91 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..380a7391a52e70d43e9ce8a41f63756ea5f4ce8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886a0238f0c8e8169b0a8245d957e75116906f9aba6901ce4bf98c90cec34db3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e0a3b4141a5695ba13f729bc3fbad2be76e5a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ea1b9fd675903a373a0ba0c2fcd80624f2b53ae9af882e64e759acfdfdee9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6a120024e7d1e17e09e9f99596604ab107291e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f905f047dc07af4969a78f1a11e09ae2d1d4a289618dfd1aad087ab26cf1fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f762518ceb15fa9e198f9882605f2177266a8ed7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77471cec983eae1daf6aa0cf37b71ebb556dd209d06a7c0428a826df295b590 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3ffb7399bbc3b422e96086573adbc64a79ae97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3c35b9928630dff12a65f3915de3664e78412f6a472db11d4ff243ae4f757f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a46ecb40e87bc1c848afd7ff5b0bbb674422d72c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8bd3a6b4daf07e863520b8b1d71a7a1ea5d18edb6ea2582af253fcb7cca30b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30882bf4a5eb18112e2c4f3b4483c906bdfd21dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6766d5446c7a271ebfb04e923ea81f8c27ef6787743205e762c2e107e2fdfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa880dfb2cc2efc01353f4ec7fb81d654aaf8a9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c96c45802b155232eeaa2829623f4c032bb204e49fc6b45236d0b599ae34ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39608384dfce6c9f8a1225fdb979e9eadecd7c47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:824730d179a45ba2c1cdc0b75c50c3df3359ab85d187c66fdec5c6320bc8baf0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72feef6b5a0a7e1e6c873db57cd81c064f463e66 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe454bf5f7dbaca2ee71efd8ac9f7dcfb91ad4417bd0e18b6a6892b8ffbe306 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3a1bb064c774f32cc21fa954ed0b195593f7548 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc70c40bea0bcd3bb2212b5834d571ff059fabd738aaaae45d83530bb27a8444 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66fee29e669bdb985e1c3b6ca49bfa7f49a71be6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987de22871d6127d53c4e1225565f10e4597239538c267e12f7c63951b90ec75 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e64cee1a50a7333ecf787230dca836b9372b3b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d653a5410eac2781fe3caa5611431b9fff28e7e6356b4f7d04127a6f2f75a06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b180b77c1b618af6563a1b1a4ece947ff2be7668 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f0eec2e9cc6ae357828eabc038aad514b8d6e8310442aaebeabaa2a7e2fd62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..834528a53b5e519cd6595f4631afad545362cba8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd6ecf859498923fbebbd0161f0ef43c725362a78985c18575b03363d462dca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c00068fe99a22b34d4507a99668ee9c4d2caddf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1f5fa8d16be38d4ba0ac4420106644789f9967786e3fa13aee832f9acdfd8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1441b3b51e69448354a337b01c9d3caf94d8760a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d626d39ff8cb4a4b1531097c61220dcee9ebdca6ce35d2acd9d092e1e9b5741f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84406c83c8db835441507092d345fdf4556397a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b3eeab68c6008ea9e9a97f3124aa5852b89440be9ce1a01855a04b4cf3d5ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15e6dcad172e747e4b7259f70865997108a0a58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404a95fd3b3b0ef9b37fe3e8db0b7eb6d055c9e4686b39c44423bd243e3f9f97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1254e238db9e96d7b9b2e9d59001c4f67ea8f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467dcd047710d23add95e7726d7c77443c91af182433331f0db78f64974c9544 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..799d4b5fd88c007a378764fdc70c2e1a20148990 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1a6d0933d5f34c3b6495454d71aeda3dfbbee3c85b734961b11bab0d9f3a87 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..137304134c12a4b3b6a8f708aa9b0542ba1b0ed0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6247924a37583ea746cb338c1edc5bbce069849e2a6c00910ba432a753f6f16b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d399fca3f49936bd403e82d75e209c28ef56cb2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:676173ffb69fb59e345de208fe6392fca2d9ee763af6ad02b4b15973fc5675e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81d6a84b9b6b165df5f03cdd8abcaffa99b6878 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb420da153be2c0de64707a4b20f2a9c0cf45a0dbad774cbdaca09e4efab0942 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e65ca28ba0123287c0f332a26c02e4c7fe9c9be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ae4e4bb7a537ab21ca456d1943ed87f5a4fdc4f7d6ab5af70743d4652515a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a10298fef5a18adbcbf673a8dc4e591d4cbbfaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bffd57fb24affb30006f08de1cfabf36fbcd40818c0b76463bbded8b12b9c7c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde7b1804ef01eaddf0cc257c44103971a8ada47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce56fc39649e2beb100cda5518d0827a52e3f247afa49e4010dbe77d9b2ed259 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..523001bd42590ed5375bd3b700922f365fe21522 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6da5d38f5a5b587acf849e720b4fa2c7207657c919d255324954122cf63f1ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b4b4544ffe633b198bab18c66d9072bd752e14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10773b6e3c9ba290dab84c1236efca330de38cea67c60a6896c0b4dfd02152c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ef22ca9e702b71ff2a2a7c214639ce0b1e079f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4672b946cc4b9a18038fde1b05ec446bbdeca2d4d3b3c0d9c524947425d36e7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10a0631e120f7086c6db63f40d8a7cfaefbcdd90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83ebd4f559f21c706c6d714916f55961b2c13a01c0b2c710380525925048eab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc5d6659a684fe4d3580e88f3f46736510e065bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49fb6ebb891c97670c2d1cfd1b5cfdd90f1ac3a92bd6a2dcae29c21b0d16288e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b2754b81a381921ab40f3043d1dff15bdd97d8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc6b82ecc85301003cb0bc1c408a52026508ef3032bb4c40a9fdfc6df6b596 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..430ebbde65523060ac99e85702bab07f90dc27c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc28fd94cdaae8cc4f74513ee594e1cfd6291300126b07641dec9ff96aafc9da +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a999eb47ef3df742775e836cb080fe347149ca2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0ba3e447674e478b46e5404c00ca15c310ef2f7750a7d7f818da4e9d39e6df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19801dcb9e6b49eea4a0f29696a84bebd0e0a5d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25777a69c9ed5c210e55f38e277de745c619a3b5cb6828b7f2dbe4eea1a05002 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd72e712443cde2b2720901389de6ae604b4bc9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4438c33bc216c13fb8980a545c18ce36efc9bed37319a13d2ad2b732d60c4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe68a9784470878f6baa173d5105bcf92add8b31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af8478341f5b37239a0a534c8f2a6e493d1ba73daee44687ffcab374ff1ad28 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2dbbfcffd71bcd3e5dbaa86f8216cd4d16fd88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa993ab38c9e09dce5b5a038a01970efdda46b0dd7e24116adc264e59403a075 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad615667ad1e805992ee9becf872c1f92b81bfa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671d6032a53e07c17a7475c1deb064d8b489d3cc675426b49642a83c08946bbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc69b7af13c5d3833f2a9f3817d7102bd4ca4331 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2375d845eb8e22175c7765fae1db07bd9ba3bb06efe9a76b97cf64bcd498e926 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f3c131e30b3f3583127a2148b36053363dfae6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41da6fc846359ff77d629f9e86b35f2e026d6d79416ff798e97795b1762a1c04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6df4d5451b866e676952be3dc13c17ad09e7e78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37692c632776b7975808ba06b443c5de9e3ff27c195f38cae1a09dc0e166a861 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afdd0d91928c4cb976895b913130df98d3d20892 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22184ca1ec8a5f5eed6f3787cff1bc4bbe9b70f44ff9e69f22dc8660fbbf2eb7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..373bdc6f78ee9c37d22db988ae9068a07858d3e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a9ec4d1e0e32e9fa99738b4538c9ab97a3470736548da2259c8e90f23f3622 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27341f0bf399a73b190ad4fee077c7620809a95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ee7c56c254f75cc6848880a3a02855f42a3bad0475ba809d2ca48314f275c79 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d7e37657d161f1e4ee8d032a12374bad6b344ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44582674f08f9a4dc6c1e621f41059ab64bbe42cff27bd802b99576e2f6f5c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f448d0ef0846b645e3f338a4b9df4854202d604a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1732c8b2d2ec8ca909a852076e98da1a6897a1569a18f63f2ae47edecfa99a7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..200a7ea8b68113d728512c63b4feee754cd347b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42cccd76f89a1e84ec8015f594be95709932e7a0879cbc115ea43d558ec6793 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6bc3fdb992ac57dc87b69ec6b77cbb249bc71fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7976ca4eaab857081bcfff7d41c7a10704f6e83342bd3ef308c12b8e850b4c3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9ff2b0c280611d94cfc7b3645fb824ee4544d7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07ea138138cebe8b4c207c5483ac5d4388decf1e9e89a7c2c1add8fb721da37f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b5c817d881b7be32a4e89decff0af8b3898096 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce2519f9efaba442745d73f50f06a4d368c061f4996ce31aa19f23f7d611881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c688e28ac65fbb542e62c03c10e512add77b54c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5285e4e2d3cc1f19b9ca6d7094652de9a23e856d612bc4b55fb044502699dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace3bfc09b264311376608c9cd8ccbfc7af46d01 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1ff408102a9de0d2250848f62ec6e1114d6f2e5465a8ff29d918a2635a83b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53db09010c9ee815aceda05744c5f08df17a03f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446faafe472af7ce242c8217d78f6a85c66b397e12948a192282093ea02a1eeb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1f174841e2ca18396f8eefdc17ace66dd333b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99b1e54d4234e2e7e87f418c7fe19797aaf18171bdd72701b7910f32b3d2b90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be59af7d54ddd9e29c1085f42a20abbc8c320a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88af05d6b36ef67c22009a3725a12775d0bd97d2e089ffc066960bb26b32fb62 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85154f58a2685fb63e37fc6f6df7a57437611f3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f8c86dddd2d6f24fc6dd3fdd49447c8ce8247d6ecb0e1c1cf730a0fa6302cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b834dfdebd7c49616eb8b06bd92de83f64d56e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2739e3121b4d0699391157528000afea887adb7dfa2907c0a4ff9672f9c7d8b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d45d92f2f17b43158102ae181815bea45119e58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7429bb396b0038be81cdcb448c1e5a041f75560d863e757450a767a131bf752 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b526402b89ced4193bbbcd691f4d2111371e3e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49b5e3478618eab21b35d338771c17d70b7c9b001b1a55f46e028be3761e9ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bf866e76b7126f5b95861469f52508740e9e697 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8676e2dc02c79ea6f7c9cd18cc98efc16d5d9e6c47482ae76c906b8d69cbc11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a2e33dcf203f7599a4badf0784fb1927c0427f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52cb53d60ea0314090cc07dff626d5aa5012efee8de270c0608e7bdcc3911a98 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87bd8c22806927efedaa8242d2a27ed90f7339d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0906ff278b590c8d8dd32a1e7ee61d08b8bc59a3671fca27a2b19109e574c43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7c341986551be8b7fb5c116addcd708ee666a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d856ad69de0102e7bbd2368a5b71258f65d10cbd552fc9972f12bc09360cd608 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b342979d0a8db683da9cc9863c309913ff2c0f52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f9e485afb43654dc8efbc481eed16e27cef154ffb63a6d365be8a030438e6d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c7f1cc07ed9a44b547dbaabb080c68e959f80f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb065a93252b4b839992b5e2ee7656bdb08d471fa679d177ba0aee59ee783ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e74ef247cc45c6e95f0a3ba815bccb5720c959 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad71640fe1dd4375ca7c192c275a742a4087f220546cd802772bb261551439a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77486f1bba2f799c8638cfd65f63e77e00256e47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e05367841de032fc7875aad31eea4323741a536362959c49e30300a75e693e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab62cd7d00add60dd754614239770434bc2dc8e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b445e107adeb22b76d470b4d2aac4a0cb1efe453f9dd419550b1aa9acb2ecef2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc612e87590d9071c74ffbbcefad57b8ccdbf16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09a0d1766af9c3098f5a05fef9c7527b3484a03b778fbee29496748e6a03e5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..299d2d517be4f24338e7b11737b76e02e495fa51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:451cdfa621dc4bc198c392ba18cc61a1439db221ea8c80297a0bf428d3805b67 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96050f5baba2ae4ac14dedfc7f234b5ca114d038 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9ed2786a613cb05d817fb52c40df785cc010fcbe0cec57a7da63115bdf3ff9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a746ec29254a1afa013fc4177b0580aedf117371 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d09dac1ec363f587ec9c09767a6e141bb6bb3b72f471bf32c971eff2b299d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9474b2318544a196e829f52ed08aa1bf45e4565a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f985ca36fb3e58689afe106e10e3601b0494baa4a165a61c859b5e3b70a5b6ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56d4de52e0a8d25a1ba82cdfe5e16241d9dee0a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbc1d0d88d131311be3a8b8dee207730a3707c4112883a6d11c21c717b230e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1135adfac42d53fbb56fa040e3a9c01733bd948d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea28f3d47323d300d64599e912b9318230dc2984141e615e64f9ae5e21f4d87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aab867905dce55ce06161b9101583e66e952373 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cdaa143297bda307ad76c80eb47280817eaeaba1c225b381f043539f6011862 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31c6426ed9d08abb5e5a2b3ec5d56c5eea9ece6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9991a483e11d236ccfd59fbded4f0ee6e0b9431aa7f97475f35dbcf92baa2b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13660ea2195971d42b4c4a87e424b39028b407be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57433bda5afd8b6b268d99fb3b34389f069cf08613a19dbc203469976ae906af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2998a8a316073a97464ed4d78d15e94c765a499f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc35099a32da1cfdd293feb13a1e3f6c1aaf7c8c7bc0d1bcf2d7d35cdb15595 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aa164906f538f79e5ee078a6deea8d3a46fbb78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e04b28ddb718755414d793078ca6ecb6ed9b5047221c8a771d3913ab8ade515 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b024617009c342d05b81c2ab4dbf34be23159294 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170ae56593f87c74a067c87d00891696d6bee18820141594d445c7ed133794c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ecce526333775ed04d4206f9be673d1a292ed0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e59f1a7b21847a53eb72106ee4fea13f7d77b27fb427468f325966c6ab9f64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44bfcf8ab62af5a62cc90c33d4be934d1f98a82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6af4df17cd41a5b5bb8a5ec3c7d2d4763bedfb8d4c4db65a77f3286ad5050b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c78590516876218e0aa6ac8353e4cdd880d7c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c02f4f00e86d81c4cc9a35401c87dfc179e3b66aaa19c373da260d41db020db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7f23625ebc5412f88a022ee293609371ae3df7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1138a7e79107c500badb9d08fa5b6b938bd4c6ab4c72e7f694232dec2fba60b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0812093b482c7e4daecbdf058eb516a0d8c3b02f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222e0ccfd4871fc3fbfbd7c0f34ef224fb209a7ceb32a4e1e57a1b4cd3c70552 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a598b7cd06e88e4d5007f7ac11bcf1b2a24e390 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453097b4539baed1501de1241d363be3a5ca2cf802180067d7e2f5868d9f34e6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46db0f547d4b64d0c1d59004d6ed3b783ca97299 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7a82277bc4d552d9c692266efc830439a31b56f37a31a510498e0db70a30ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e05fe24df62a2e0c45dc11364c8fd7d26749588d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666acad6a12b07b839ff1e0a6e90f6eeb3f3f65fbe343cf7d1f18c5762cbc2a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e38593e4e9e6f1f6236bb888b505f98a3370d21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f26d169bc60ddc5dcd2fc9edac65de55ca88e09775dc29d4b9c2871408517e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd30c6465a5adf0d9108a1fd574ba974013677cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f11daadcaff011bd71fd9dc028b712dbb12cbb8f7d5a6f052db5de6cfa1902 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca42a3069b7316243710a8e84d3a2dfbfec03c69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0538020c6ef50a8ac27540f9541a7bdf7f923c91c0c3e74d9140bc03a9c7801 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef030832c874b928b0c1c0e36121e131ef1b733d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21b68de5edb8a282b592c429fbbba974bee8a5a7d700a6dc5dba881102bac8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..852793fec139a3af3f3446823f504d30102a2530 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f43d794d4f8bb479f5248f85dc90aa765d40f3c277df50b28682c87972fdf8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27b654d84aabb1d5bd23f3a6a27e3bc98befebf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea55b0cffdd16027633452f9590bdbe8e7ab76fdac5ee0e0802013a565e0f87e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3fcc8cb2909003224efa8d27463e6b951dd1ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4a98230120cd51d69750b5f1ee4ea7c3fb6eb31853c4f32d3bdf286a0fb740 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e900bc1d47c4941f243d81c55a70baed62d2f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f0443dc281b741521e14a157f4cc9f74eaac896284045636c35cd1e20c384b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ce8c997df2832f07dafdda2d054b4f878dc2df2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710a36714865c7d9f4db84133bdb8511a6124a82654e201d82b42f6d4c156c7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d52103531eb6b0542668b540e0f915617162e5fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6808af16427228690502dc909fbf06629db795161c7bd165f8094d8b8bd50b54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07ca107f1b65e08e7305c926e608d2774481ca6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2828e1523c8b39ffbc64e77ab636ce5ef283baf41523ff60bdb3a4f6e7b51c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..289f0311e6a5d9ce745072a23faa4d3c5ff8b0e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a6cff336a88a4e41f49332cb296aeae5b4a0ea65c7d0fd5bb51ad8f18502f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d65585d97d7502325b609e575be577969f8bd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cbfad26d829b9d3e4334e21fb1e5aab4a554606ea641d7ea9ad49b38dbda73c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cec7b89407ac85e8f369255b8735a908c5a7ddf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76067fa7d4eb87efdb98e8905915696e94247d085acaa0879d2425ef64267339 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ade036f29e5564cf6f2c19bd3abb7579d1347f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:027082cf5ba5dc31970610171374176d1195f3cb0b47d304f083461374a6c33f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2ed9672f54a175b1e1ec091a30bdc87063bf28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c2f93017596743e94d9b62c87c503c4a1aa666b1b4bcfcee215d4a9281c8ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d13a19daaf6fb8d9e37fb636d0f4ec4bf82c5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7e3b72bd3c13b354fa9df161f278b2dda658ee6b48d2a357cb8519ce1f6430 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1564fdda45f72b11c9dfbcdb7faf8e9cb34d7de0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd4e4c7f207fa877172cc3617afe1a3b4e1426b2cb9e62f5a63956eeb3f824d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..089894b9deeb25955fe970363cbdfe781ac93deb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a97cb9e602869d5e9368e90a5a691ce2458e45abaf3cbfebcb679e05cd620a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a672cf5cab5b6e6dca8be081dbf91ffc0cce7efe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f17d06b383278f3b602098ebac7c90e57b5dc3cbeef4f4a3838b4e88a98753 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2000bfef74b05e73535a5cea9f499b4cb37a8728 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9fec39d53bdf89447494b61aa4ffdcd8caaaa23016a361f2c996b87199ca3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b17642739de5096dda52a8554fe143e0656717b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6e9f2f7fdccb753153d67e9ea60662b86b3772a09c1abdc186d9c9571093fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6f9621e4efdeff0cc91ae50479a1228ec1acd8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e79b8297122d718fea07f39014408af36bed052e50607063a30926413e8432 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbe018f05612b8b0cf3474663dc47b5fbf72184 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177b88e68ed4b080357e6e6afe81c520c031f4adfb775183bd6ea6380169ccc6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fea352a32574f6421caf3ad5bb6613d16a0a7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a33c800c3969c3d8a589214b19ba24f906467de896954887f93d12e2497037 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01d58945086b467723569059833dffade4699810 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5532c5bc52e4dd1e8d877f8e9006ff4b67f2bac5eb04daf4f71575cea597c748 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff0f8b6517dbd38f936d078469d49114b0a050e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739a1b276f38621a4142c4ac9dcf8bf89140a747ccaca7f9a043d2018e02cfeb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdb48ee4a3a6a6af848fe627aadf6ff53cfe63e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2ac6595c32a8e07742b3de3036ef39c93ce33636045397b5907d576748d55c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea6e369a3b37950f3545506a6abc22274a0fd3a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4fba35ccbed92704fd12d785295e8801f7faaa9b1f20b228bd78f2f77d756a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e8e5b5f07575f0aa4d70986654feb0580b3aef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc028aef6f2243474942eda645e56c4b6469c50dd567347ae8310be7d89274f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8471c63bbcfaf6138a071caa6b1317c86bb59cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d56f7f89d67b46fd46f054cad2f6f6ade0d7ad2b6ce00dad7bd12a787bfe95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d76fbab491cef65eb261b642480d8f10b0870b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf3c66f8f972cd706317c210b9d186cab014e8443b650eec6c87c5792a8bd0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd880ca6a02163a0e77fb0cd1ddf2f49cee45329 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba39112e6ccb568b218671b7a50033edc1fe14795fe4c87d111f64ab4d6c5bc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cab784a57710f74a20b195f3c13eedf261a5bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6a2b706fe067039fa4307b584973f9bb47810ad3437275955acc4ea61b0fc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..714bcde24b1d85f119747543eb25fa933a905eaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941a6fe96c0aafad7bae368456aca69a89cdafae5de464351287abc002e298ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b008874227c3d497268b0736eb7465e8e89ee927 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033568a3541f3e7c326cefd6849eb618acd7285ca24dd46b38547686b2831c63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54491ef8357ad1ec36e3369569293f72509f8d1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc995e59c26d3feb119aa7ed547e91e21e2119582f3343712d19300db4da233d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf39fc265ce212c65df3d82b9278b5f7b1aeeffb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08eb569bfae1a16fccfbb439752b2ed0cf74456c8d26550f8decb2854cf39f5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8780cc2746ace9a309cb60b0cd2bb5d3c14dc2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd76f43cbe2de2c10b5f04f24db463cca2d1dbff5c356537786000117b668c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa9865781a85e9ddf2eda7445671fbdbc1d59b11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad43127bc57a80796c97eec3ce50830db686b45c10628dbcfa8ca29d4f17637d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff20994b0280bc2d5adf7e438171434584fe1098 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a21bd39ecea3d20d8cfc54148f1ed89fa10db3558255e0d657fbd8b3d083624 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e287b0d096e9ceb2df09e33e6b11e47a6a91a920 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c68eaf8bfeb927b257574bc7abacddb70be0df5d3cba9b292c70010fc9cfa8dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..242a60501a9c2326acb42e69880f19bde56a3c89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092af25c730bc085163c5a440969cdc9d91bbf3b7200c1cdfb446da05acd802d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ba1c5ee2fd2777d946b898738f134d8f32df1f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c1950532866611ad0d07ac1a5be4c09922a53958c32814f57da123e057b2bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa23ef1bc8b5a70338e3fe84466ea2d8056a962 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd81bb45c52a8632208230abe1d21d0d00a786ee1171d1104373c30c1f7ba319 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21af6dd0a74f051f0d7b7464b9de219dadb3c752 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bbd37a2e3c32ff98df38321ead61e86abc35a21218f24b86d06035b5a60168 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d101d657ced0a41a9f755fbcae12dddbb795bfc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9c38a5bd7b3bccb5d1da9b92dc2f7bc96e0bcbddca769de2924e12f51cd957 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..680f598fa533c0e09ee4247e419d3c103173ce3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0ddeaaa6d1afc57280549ac90a1aaca0040eb328e7390cbf20d0654065439b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7c65cfd74ec5643aee443b059d19fe93b043565 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c5a3cadd4ff5032650f4086d543ade5b104ccbd63963ce55ae9d1d257a7c75 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7692790b9280f7f55a5a42871a28e205875a1c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c31415bc3100147f49c19fd3c3eb7fb1c98633faa406c88a1b1d5392a50d49a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78b95d903a5415fef19d03bd4ed32dc78c2c87e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aad9db02e6f5afdc3ec24aef5e41de934ebfda42362a25aa5f76879c6e78bdb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fbf5b25275b2119d17e2278e3e022586bda88c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6fa3da6a4abaf583b5f9d470ef07f695a579073affcffe9c4b25e78decca55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..005ce62e9b02578656f5226f5924295e742bfdb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430b47a6377afc37d138a1ae30508138f927fe8415f4080c552a4fe080874c67 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0ce2b2ef84d3a54ef34cfa16e4c62bd908f6ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec3c024cf55477e46a46327af6beac42acc95dba0b11440cf890cd61b72f442 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9e14b1bd8cdd52ba8a95f7bf7869f5757dc749 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca808fca07c37686b20fc66571a73594822791634fd641c16dd08121faf4c748 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52fb2bef15b90e7070bdd1b1d406b569b0246f73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09242562b7e9d89deb5e7acd938cbc90c7e7b93a302eb2462b3f96dfb9658bac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e13848a3ffa41be38d8a2bf350d9c18d7f7411 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507c5a198a8c6c8051c4e3fd6918b46ce400d1d3645055f298762e6ad0f3bbf5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3cc1ea755faf68f1378ccbe7a3bd3069ad4ac3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771da0cf054b091104f8b82b9f03cf7da30955935b1f397ea50bfe6c03baef0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae1694439b5ac1be79d912a09269f91109045c72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be0e903cef69784ea630559996e73b1166054983ea2ba383030b459260c220e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44523f30cd155702d34397e782aae78c109e6fdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5658378b847cc454def46c9e43b8e77282a2bd820795429e852ad6a3e09078e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0365549c0aaa93f82520eb52370bf7289c927721 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f624855b2696c70e1629e7013ecbc51575187428403e690e91a5366c44151884 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..298d0d78e1e485524e00edc3e123a0af5bb1ddb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be12e0f773330e71dc2b70aecf1aa85e3c01631778c46cfeeda7b1df87b4ae1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78a59a4e8203bff511ada97b9b27b4f50d382488 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610f9017707c04fd6a55232040b6948d16aa66d172cb5f3cde99270fc542847e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c2facd01b85b5833e3a22f2a3568598157066ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977335c39f3f07492c0f4b9cb8ae2323bbc5288a5513320643acb99ecd844a11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f4efc4100d5f83c8f06bcbac6339071356d389 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e025bd21af01c3f67144755a778017619291b5edb79ce2568b5c666b90c77f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8009498000a1cc00a9614a9796e0390bdabd05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efffbee0197f92eba0e75defc9b04948887b6c9a8d2d48707cd51f6c4e2b6005 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bef564aa5c88a7169ac8b23bfa048def4f15821 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a685a981213b310c483e655d9ab637c8a5f6c9f060216a83d6f3e4423c73d10e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8398bd3b576c5fd84eeef803af79ecf14a7863f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be5511239d30cc58e59d2456fc5fcfcfd1ab08f988c55c198a692ae9219eb07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea2c2757f6a34391f4e14b379110dbebfc5873e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3459925e18e4977de9d559f41067db24d899140a3a7e97961b68ae23a472b5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69239793a71c7fcd136fb1fa49a02644d3ec7a93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac7110a4332d274ae16c85f17c4055dabb54f522ffdad44419d9debd026991c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32df90c9488265aa923c3e5b9f2dd1bec877fc8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7767ab031af5b4c2e70b41a692506fcbd8de307cc7c2e2d2b5a2d7fe3be32757 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d352b6a1c1d5452ee813001eb614d8ca626c0b69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244a8c65d5fabb2661d889a61dde7681699b148add71b7dc0741bd8c9ef70718 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0941e21237ccca2d7aa86bab3f0d326ff9bbdfde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f136d1df4f9389e8fa0b3943836abc133212c8dd7d6d7923d67b1e65495814 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f05dd571ed9d2fbebf8f6a359dc0d574fff406ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58775629d89cc5d19946dcf85165b913bd60b1e3cb4fe8fa14e732c8d18bf494 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6745751257bfaf497ff3aa86af11fdc7d9f1b5f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24908e8ef9bb20ba6b2e2341ae7d613f68fff9adfc522ef6f409ccd0d4241a9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8ded9cc393293b92492a3b78d860c4edde35da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc9399edd7c35db3cc11f2938bb0509f097d7c1a47bf9948768ccb3145d8cf54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68453279eb5eb75f16e0f74ada5c2f898841a318 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b45e8dc34e730022c0f5ba1c3a6db54e32042ec035fcb860e6dd677da545acb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3b3dfccf05d599717bffa78703b4829040b2bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37ef3350894ad0ff7ddf1d15b501c804281d4de12eb4278953d32d32e4dd3b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e95e193bc9852d42e79a128ce67552aeff07ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986168bdff117a9410b6e819fac31d0dad05d437f096b11a12d8db009503ea52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c32353a28bdc8df157fefc118e27a401b19c952 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22e002264553bd855b5c058ee01a20df50326e7a2f9a6a80164cb30f1aed835 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdcc77cbf3261e3af46459915d3fd0d0ae2ec306 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35077a96b3f95db744a4921a0b9591b6065c9e82819530bbf01f2c4dc0f9d0a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b276b0a2a4c87704117dcf81f1cca659b05d71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d344362392879d441779f5b9fe83fc5a87f97c829ec9fca480ada2fc62540893 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e03f86d78c1e50b3600cd5f8cfd1afd6ba68ae43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799968e31a547a0dd97e4e85054d8c392a037b98afc98b58291215ea7a5bfe1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1612418d3d88abd2e6670a7252b08c11714181ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddc7a1010155df42f07b1cfc7801c0715e388da16bef7445ba17b76f282fe66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6027f7c0ad66ee658a139c06d20b70c07ee47ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_15/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb17644121758704e0de5774904bcb536950f7f5d20215fad6e47acbc35ae9f +size 11395