diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b14d2a7cb7e2e324387c4fee0a157953c2ae70dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c11ffa139f77bca740c212a2298c0e5fdfe1b9394cfd352de013fbf56d6bf5 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b3840216fc467c3a559cdd43533424e4f8c6a2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb805f947113f00b22822a99b43c46eec6bae18b0220696cb4cc4df6da44200e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23aa04f4dbfe86354c8723af8fc9a87ee6946a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075949d700797a1158594778650381b933bf2a4de5553afbb9a69f224056ace7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2af60dca494c9a01e2310efc4180896f9ee35d38 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1255b476389a23dc6c7eb650f83753ae92acd69eaefae4005198debe409bc857 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4fd245dfe2090405936bc632c6cddf0e9cb53c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aab51b6beb5caff267c772b27514bde4c8ea150c56aa4220aecd8a7e8b3c536 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..273f50e5288fd399b4a4cbd3e50893367d53b787 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13105c640a58ff07b260ceba6507d64a8363f949dff3131434179129a884c246 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15aa838d29c2f260468ec5dbcb55f07ddc458d99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f53147761badd3cad324b505d5e6b58a6edd94d2b370c4cd0257f1731a6168 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94912e721477630b7b9783f98a14d46b9d7e2b61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed1e49494b3688a11ca6f0b83ec7d3271941a6c7b2d60aac48cbe7df1cce08b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c332e6a19a388d084572d22627723a8a95890d5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8ddc4e59cac74bc658fe17b57039258829df64ef32a1c6eda907ec3015d03c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5821dbbe41a1992d764a405458036a234b7f838d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5d22bbdd9bafb6a4169f8937ba21d500072fd2cc2b647ec34c880e69390672 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4e5d6bbdd78724dd0db9d242f7d92039be2fb65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfa40fb99152219952d44562574af17c3dd625bfc3d3a2050e9e7bf58460470 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9c5d4bf97abe57e56710d7d6247fa9f83087024 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98a349b794e1e78c303fa4676e3d1116aa3743f57c88cacc341cc1b2417d9e10 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a1e2be18bf605285dd8985ab8d507bd961e0e1d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8da6720a87c5359e9ada9fb8c0a8038b1f9cd9f120b8cd6ad7af6ee2b184997 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c812bf9284cf08dad12bcc93bce5fec6b08258a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45125d4b1998dcb15d9278b27bc37e325628afcad2d8de0acc422009beb99bb3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..814077e2f31371bb53c6b981f8d35866c47c55b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086e0d187f38b1fad2a94a92656ef45e031607b7cd9c5ed5727978defda06e7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a4534b655aff003fc473f3ca97ad8fdb33ed663 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927f3973ae3bbd9672f58c6e6656d5e098d8c4b29fd7556b3c2491ad8a3c950a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7714a5d0c0488e6fb3b99afed686601cb459dba0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eef33c1565532bbc77282cb482c58051fc7e8c8b8a424076e1fddd3b4f95b5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c54db197dda92d59c4bf0f970980453af3fb72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd82d3da9be519209a0b6049379dcbdaf9fda24ec39092ded652faf956321313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0220b92bc5addb00c25abe4c6acc991d5e56c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b862e0ad89e1f19a7006148040f7ad988ffc6bf25fdc4b18c0319d76a71bdf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb116aa8eff63af2b0a94ada9b0429390bd305f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f31ebd41c2450a64e25fdc5db2e5acdcfc8fa60c61c60ed80faa9aa4dc47f1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..280bf20dfcf21c971d2b004ec4c83ab88b91e4df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31203e9e154f5c3fd2516840155b0b6a2ca0065820e7bbcdc888839c05c9c211 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce2b2bee1206088ab76de78dedcff114b1c4a1d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1878d7ce68a62c1e36ee52442a7ba512ccfe5685ea9bcd549faafe28cbb6aa3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb0b786d0b9d5efcf1d73896ba1e923abcb631fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0040e0b686c84aace19b20a678f545cb756d1b74b1d23bf3ae62939b7bc4603f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bbaaf3c604685dfa3e2938aabc5f10017e76a30 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557fb59a319d0b9ffcb97b02d3285016a21f80e239f4c43c5c54fa77c4ca8a2c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..feb6b74a6da9c50220d2f49e431c22b3853d6b0d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20b33489b01f4f2d1399017b1a58699f01d8fe4ed47d7762a94601baf0ef4b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e218d95bda502150979063f6cd0b33531dcb504 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d1219ae8f617ce5bf189ffa179008d37ceb49f6bda1558c2c0e805e7593874 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f28deace5acef43e81dc8f03adbb48760633444 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cab03cfef52a20680f9a8c3df6ae7996f40193679909bca5359d1e027f566c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..389ee212d594c169af301f92b360876f7fa75d25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6f9f3d578616fbe8f211cd4a8ab7882e17b43aa3ebdb3f6efb03efb33e5cf0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dce8db7b9197298fcfe01030e699a8c3bb7dbbb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8247d35386523c55947a55e64096c8027912980df221866f92db6075ddeab30 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19fdbbfcbfc7274fd0173ea8162ddbb2a73e73d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d20c31899e82ab70ff78cd8fa2c8a0a3a43abdd31795be35350c4c492baaba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ee53c5cc5ce912119a16c2c48b103e56e2783a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf349dbc250e89eb1f81339bb2c6a0ee8f88bee0c7186e27d44fabb3d002c5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4398bb32f92d7833dcc169b9624e281020f1d9c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a94bed1d7b45d30ed7cdc0c6de22816f15651c930e0ebff63db907d9e44951 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6be697051c4035b29666f4731d0907ac9e6b13a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fb05676516a2e4450287ec07305930184f1b2a543c4033e5c2351d0ffe65e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37c4ed5d883cf727c79cdcc414a03eb8fcda4695 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22c4cf2d7b29145665f5bc5b7e6848f05a2c8c3addcc96e375f4e7addc6a819 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97a21532230d07545a1cbbeadb1105d05a6f1762 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605317d2ac75126a12f1d8a9dd4b7a17b813a498abed67805238f552fa8d07bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..719f8f67f6524b2c59a4b44c6c231931faedf25f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3ef534cc429817f0a2ee11163cccba92c7b299f78b2783c38eb85c9f81c03a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..508a94d91fa3ccc7f97b21668a07955bcd3a29bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e34383e007dda1a5c8fe9ca354829db179423ceae651df381f8bd9afb6aa59ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..766591ca06cad586afdb1b4ead7459cbb48b3262 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e624237b9f1feb4bf8ad92e040ce21a4c51552bd7886293d22df62c8da1f7c39 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c46a56b71747fe2bcf23d9167a90136aa568d0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f074476e368926186f348dd1d8157ab427d69601f575824d1227814c4df75ebc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a901a344648616cbc6494608ba2e02f90bf22c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31e8b7f7a02ac617c42eb0fcffa9925718fdb63d564ce524be16cf0d00b266a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc11c3c0e4d5a0609ac67cf435bb60862981fb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7f839cd5bf62d1eaa1e6efe80bc2e3df50abcbc22ce9d07b0cc1d42f54fd7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6999588fa52e05cf821b0cc81eff5641c0f73793 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5b3b224eb3f2711cc00c516329b87db2acab2562b9f8a8cdb5065dafc945d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d83866935a0d0de2bf2bb0efc2c48e8977fc5c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53893725fb6bd96e357667901a6393598daeb1fbfbb7342774e425ff5495f29 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09179f0e188a554bfd1c09607709839623171380 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5471c2bc15fcb80d7ad40c1451b47ef34b38d547f70054f34f0ae27dbeacd462 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d8101ce6ce3dd916194d54addf5581113cb549f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0315870d83ed80c9e9b92687474a3c85f28a288ef2c9ab8b285a113143aeebfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce73f25268bcd887ecac467cbd59d59ad3a2653a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a10a055b86452a1bed4d22d0b837e0b6b1d87784ba24221f95806a55b803396 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..867ea3c539dda9c3b07d0383f0bdfcd8e9443544 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2461e1d10d0c7ec5b5062ef31169c180de3d0e57ee4603e57355fa1a37ce7f6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dedb5fd738a6ac9e69a0db8dc203b61a8b9b4a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b797753c3d9d960b646a283864fb06ab5c376e7976136f950224787d25ca68 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..995176f950611e1ad3f68b483141d845a26583fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecc55167efe69fd95806e47045459a6907b2c56e8af37a3e9a2a538f195f833e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c55a95fd4320390ce94d6ce1b4df40833a1660 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af778e63338570cced2cec406ba901fbf3da530479011fb4e359816db7ffa836 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8274a1e492b3d826a091502a7c474120f76ace18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190931b63c0475f0d33ae21573e3155fb7735c74880bde3aa4a699b2df7fbe58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..386088d6d8ee6d804d676b482b1431ab95c81bc1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf4d03a591b200650fa848c64918dc3637252cfd0d9aa9a7e8c38f97af81f4b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a4f5ec5fae94e374336acaf2599753b263404f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b58ff75414f9afd379a8b92ac1896132cd0e823883bc4d7323b4aa31264c715 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2d201a88095bfcd574c8d73841b7a003e5e2f52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae12ea0e48ef07045196e527fd8a75f306698801ca1ebb14c5ac9aa6d9ed3d45 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29b32942b5b99d0fe3f1afc319cebfd5301bab1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2addf7c75ab54aeb21f6dfdd696edbe730acfdc162e0773076cddb647fdd0332 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee150352115d2c3a55bb4fbb8b1e33faa570d2ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c182a1963e9dcf68506ec373d766dc00d57dea5fd9f2d151d4d6a0797c64d42 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d279970a27d3b70c244d07360b1e9d4f0aa5940 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244b3d1cc510964868e7861fd93261fd371420e43836a29a17c4bc3098eaabf2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6da108f987442a9f295d5e66637e703da3e33ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d4dbc9d6f4c1e10cb76f01cc3c875fb932204837f04b10e0b454ff49b27431 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b80cc72227f37d9abe3cf60c69733c47daa842 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1d9df84fee24f085ef7af6cdd9484ef1a6c967d15ac9d1f693b98e5b04e4ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea84e14f65f30c14c21c3488bfc6c286bcc681c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46be3cbcf88a07b84fb247fcbba7233e3c5012c77317149a2b7c62e5c1bae68f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..010a01f8a000f2d29431af5c871dc94b8bec7f67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219c5bb0cdf4a7591b5d86f646fd91033923ebf4dd2881507b91f33ee1a6a2b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ee3c4aa32a4b97c963c5b6ea975213f4c4d07cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f850a75b72d5f8cc2d18d32f524b2898c2bb21463a4449e9e116da6e3dee308 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ced75cdb851364ce9c7b320044c808d650c63dce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b64b4de28880b3121e3bcab843db96e389ac9a913f766d76700fe080a57f6d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f9aa60661989104d087923d77296573b3a970e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14916d835b3c1467114cede220bc596ada743646a088a0153a50838452595115 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e774f964ad6d5ed99ceac69c43975c7ec0c6e15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dad9fa383aba2e1893c686f5bde36a8f839f150206c005c9f5c12a6bb4c3279 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3edb4682af1b951255313074fc1fb9564f69e3d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38cb82ab088954f511771f12c9fbb19685e489c065d6b09904537af8806d547 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e8c63b8d78cc8f3494449842b300117e1c5e94d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb7051dda51f0a1f39b2653d8d714749a89551396892d26311b0d28f91621ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d14bc57a0dfb463e41497edbdf5de07826ca0264 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e10b59546ed20519e17332d7958e3019a719c9ff2d019996fd95489a3f07f689 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cc82dd041d001a6f1f31a6136df99cb273008c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a36ee65b9a14d2b8a8e3021a66157a22e4cfe6f5e74953e5ed6c79fd11083af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..383e70e9bb2299d68424999a5047a112adfa32ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f129892c4a4ad88f4688c7a096af4b66f57779236dc5b807f13a910af5058dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c581425fcfb74bfe3cacbd257ae39a134b57ceb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9699fba95e7cc7d5018277c7fb87856c02d59788ef4c3bd15ed78734e4b90718 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e55d60d7fef9b465d2c2ebd5979ad4857e32a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5026b0d09657e8eca5c9574d2fa4b6bf962a7519280439927a645f69fff30011 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7696e1665c04b06ba8cd83f3e35b7fd1c5453d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b359c50f8b0c7654ffed35e614b53dc59b7a36e542bf3332fea3863baa435a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a4c450c38553ddfa9e9e75ddabb06ef7ff691f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aaf1e67db5a131fd28d11967cd27cd74d02069bc95eed125f997cd29c1be61b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..387b0109dfa1fb247d1bce300db2f87124ffaa2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d78a50bf9ea911c01ed6480b8bf875afb446cab2f3e50ac01c6e9143bed71b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6647f3d8bd338abe4a689d05e5605d594129bb9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa91ec469d4479f4d019c98341507fbd4b1ddd9921c4f61425c59dd5923fe65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5abaf56ccac03cb4e3e3fac186f37d55968e461 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740c2978350857bf53b4174328196316c0ae33ea68af568b01fd1aaee77a323d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4502451c1aede930e25a2f4105f0a50ffa4ac258 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e35f845f1de9ab25577293a1fb370685f00a16de70028adb2bc1d196143f227 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9397758e6c7c8e756692598cf8871e608403d104 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c051b44e9e3b22d4993b59c68fbda1065426c29d9b268b4e952af86d74eeb004 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a94b239dd461584fb5a497e6622fd297f0111097 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba22265d6f466ba35abdb6be873530c7a6fd1159fc1ade2a59b2d7b304de70a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f97542976debf13063d8095a1e5df3c708c0fcf1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be46b767440b1fe7f34d504f06fd69393caf4d065733add00ba8f0960408835 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c77d47c01cfe4bc2cb7f69717bacabea778ee49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b0cb8d79b31ac930710b4df02636c5ec4d519494c1cc5b392575e1cc6098cb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3f8818bcf6dbfe61b5592c2d97914070c3e920f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e45c8d00afd1934c3593d48065ad6edb1b287aa5f4e9557856dee4622568ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc0225e0715c056b5d6a4bfa8eec2162a4f983d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89380e4337c469584406b3ea8cf5aeaae484a388208f9b1059d317bd020b242a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eee6bfb19e48769cac895c6ff2f7b9809990b30c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2037ea07dd14d41b974ad60783175817286cc85ae75154dc2e36280ec1e94488 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed59f5a529f6d8c435edcef687ff122a70ae244f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1562f665f7861ceb9040fb276850f8b5a6014996336dc3d5b11bfb4f1188cf7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4dbb52d0403321d64613b645a30f67f0948020b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afbfd535c0574d14978dbdda42ce8a9ca6bd1a4804c9a8de95796ef08bb3c80f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e568fa501e31926f73bb022448d1a29f6f2831 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45222c23c94b78da5e8e95481ad4b454e699bec721616922d805959fc400237 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f466897a9f488e1f9650df4ee77debe06784d7d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42a0c2dd29e5c3bf90e85c099e6000da2b79ddf1d63b40594b3ddb8bb59628e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdfa4d575fe9a30df43775fa72443db81648fd70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d897eaec341849e71e77bf7f8eaafd5cd37f46e731241636082063606ca81f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcbccb6d85231ab6db0f8bda57852ae11aacf453 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771495f123d114d1aeea4d82a3be27d903e97673f1866cc40d43c8f445e9e3f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ca0cbe8e5c40796c6789d5cc0efe9e460b59a34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b867c59ed71eb204edabe4a83223992f5051f051e2464467c283b3bd1c2260 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..718f61f42492485c678d19db0875fb433d68a6b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6abd44754e4363360cb2d6345d892c50d13eb794c10f1aa6b2f4e74ec97524c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c1f6d1ac9f72784bdedfd85cad8bcc6bca56866 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4467003c144cf08cf3c293110a9ae96fe4f00a3034ea9af43c3d7ca4829862 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b06a2f11a2207d5ca69e25e6430af61fc76b83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d819d41afc4a8b614046325b83074f91587d2522e347b8584dd7a0f2373360 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d87678b378a27e0701004cbc4a962d917589ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c2988e450f2097fc9b45b63c6cec6839adc032f0f14005a99e0f29c231995b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82ab283092ce470fc5de10a3bcfa2cc5da4f8319 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c998b06a1f4d5f67429d5ee81a0be6d5b44c2894b54bc07db35854a56a331d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93a0f2f82143584a41144240e076fd552b5a4e30 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bbfbd947f955b6c3bd7ee431c185b74800f2881d20d02254bd03f252df10bb2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f566b5abfb4b87c884d1ac420effca5663b25e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25587f895a49f1da2954128728c3deb9408c0a97570f1becda8460d7d90916b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fafa92212513c8691f8fe3f30113608cdf470a4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a96d8f056e67c645f7b0067928ec98859a962096df3ba367b858acef81853a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e00881ee044167275ccd63033ff4acea3778f58c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418126a191d4eec8e2337f4528c36b93a5590e00fd3476011701762b58e8d86b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbcc24ead03ec6dbbb5bcba35e2091edd0bd77af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21f58463a74bb8da0647ad67695cfd14806ea78a29867c757b6f95a3dcac981 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ad35ea1571dbf1f727190c5a01f6b5669be4da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01bc4148b3bc9ba6abe11fd0cd18a219a1344be86ba0867fa6d26ca7413683b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c0ae144ba82031b4e79024b114de2a06680448 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679d656fb8dc618c2fd0bee07fe63d65284b95d404d2cbcc2cec13d7c2698a3b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44733315557e39c869cabf6d68a69036a24b7ea3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396528c49204db995df7efe7672e7abe33216048b2bccfaee98763881188827c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a862151c681ddd4ea83926023398308c1a453bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c139ec28cb86feb16821c30c8404a253d16a068021fe20ca314a36ec30a73795 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8d75af2cf4fed84985f8966bae895223b8f395 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0a14c805c2c19c50536f2f2a79215e4b1dbc2e88e73d8e2ca3c047142ad0bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c1bf091e872ecffbf752efe075c99c30187e7cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb829f6d2b9f21644d135a5a8aef01ff1c670e443abb88c065808fe174caa7c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36b0968de5d0c8249d28710268e4cddc8a04d2f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed52a721335e938f54ce858ccf365a70d765663248e3ffd95fefc116e2fa673 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c745a4d37c66b21478cff05cbc71e8a6128f4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3425cb60062e9ea8e3432d71d786688efe4d9bec6837141a3d0df57b16a738f7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8fc460c5d04c638522a6c81025d856d25bf6086 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5b12bedbc290f9196c37560405040d1568bbc9fffd99f571ce88aab7ddc662 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c408885d73bed61e4f3a412ca35dcdd48f33928b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92149a01f3d47dd16b06ede2d19f816bb980eb8a8bde1b2bbcb9fbc34eee4b49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc9c919c3ea8a0984f8124aeb2cb2ee3c3526f8f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391e2bc78ae8dd6618eaeb22605fa97b741c5c9becd7b06ec57645b93115c855 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..460278a77e0067990b7984087e8a200a19d6e50a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fbd77efebb35abd1ad3dca24211645a56c6747c1824a015f0a3931b3f2e4ade +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bcdca78cd88a4ed43d6e87ceb91f3dc9c04e7a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccc8d26c00d65d854488b4d09c45c0c0c832f4b07af3be41363d7a20da95cfb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a677dbdbb001692264ae0c93c1fc1ddbd2c4df58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86893b5c344a7103115a40b97634e106e31807a4cb09162f61cb84f07a05124 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ce2eef4b9a6ddd485e0ee0be03253a3ef25635 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e416a98953eca941c470790d441810c0be2d77c9d805045f29ce9fc9838bd9d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d20fd7454a39cb318e8622f4324b6c7097093681 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff29c478ecf517f94915cc6b94db68dc7bb2b4015e6d643e8128b8c0be65bf01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bb081f714dd642e42b8d0a5a29ea73e0aa9e4de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5beb5e19b4bfe28b7776323e80b3003738d78ef4a01d026c67afa055d08379d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f9dc05cb122b93185d2f96b2b336680c39c7c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f1c22cc21200c45b1c636cda7ab5ad18de6be9d75c4057fcebf208f1dd14e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3be580593e0cf05f6aeb083dba24f4007fe4fcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891ecb28ea2cf683e32a1329a983451da35309479ec25061d21c6fb110f13167 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f714199f2252955358e0be231ecd1077b559b35f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6218da5ec62d9d4dc0b9be3beb75801388b68f250f68413817d071f74e0142c5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf48c56119de0c2a1810cd2eb46db1c1eaa78d4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:645cf3ed17e0fe4e60593f8639fac2baf0993df26f8a191d93c9adde834e733d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..788fa7c1e3f7fe280150d9a78464dbe55cb9d6a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf48c9a5770c6c7597536b6bb8350645cd2e02d52472c45da2f6508f40ef6fbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c850598da5de5f86316d80e128ad259a82c49b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405913ca7f236b574f6c04a352fea5e1e7dc5134faacaccb456027e645e0fd96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc2fdbc20a20b387a78d735d3d09cb5c40db2d63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47fe49f0510b6c5bfbb1782ab019648c249f10daf45cbe7f0c5437ad3e703ad1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a826689d45fffcde8de19b67e20d687ba5510a5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a07ddc6bf3391a6ff81e813095ec6ef91e5b21c38275ab9f04b07385b6abb55 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e063a81c0b94b69d6fe74cb4539d2396f5772642 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb3b155ab128769d003d872016fd086a1df5302972b5829e44b011d1eb1cb1b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..569f6facc31f0fbe376c2f4e76973d7483db5701 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ff9d1506a4eb70539def59e3166371d81b5ed3688b946b72d669de1114a8eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54938ed5b77e8ae4c59d86dcae5b33b91cc2ec54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d427af6b413cf98c8203451e7bc4a0bd8c2b22353cdd01f1752d99115b6c6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71fbc61c98f6ec0c6f6c7bfef3ed2f337afa8be5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b421cd64e20c4a2a4c89285c2feab781781ec8ec633b8c091b734e41bb10f79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eabdb806939b378ed8dff9e121eec5d35578c03f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ffb645e46d580716be70a34699ee73d6a951dfb1b384008e50a571ffb490a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a286b75c8f168740b5222b81946d0d206c806f24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d3dc7f110b05ef07b8801489fe02a97afdd4d5ccbbc4960fbf8dfc3d233c39 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78eb515a5c8656d2e4d5b15fdf0da2b148bb3338 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4bd85da8efecddaa712ebb8fb9daf4bb20098f70ac88d03fa90fa4c1b90972 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09c499b9957450c140e6e08ffc5f65bf66e15ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc4662afbcbf87cb165fb532b8c38285f4ffd6731266d281019468c02895987 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8836c42bb64289693fb23d1c62806fa6373ac751 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9a83a220f0434fdc3facf12bbf90629c93ba723b39edb9bb9f1c269a4bf163 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b2956c3fb4f68675f91e1a8eb6ec0fec82bc370 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319d7ba50fb3d1751ca71edacf20f37aa8809f413b6134517600c81e7cde8edb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c722f9f7aa9b4105d0ead1ccf834e8ea5e6a9fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f7f050e1dc61f86d7d23857ac5cebd3b0e85727086158fad8755305b47460c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef21ad43a103b453a189f01271c558337945f1ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c401252213960dc2ae61040fb1db08af1754002ca1b4a26ea43205145b4c1cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e87449b23092bc91af23e945d6d4927d2f901e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9832d06c93f4e7255caf78755a6b5a64de8d64b70146a11d9a90112eed358ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..455b4a1418cb1fb3a70068fed3daa38b66d2204d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c444716ccb0df84e38ea1222195775f4c91d27ed8bff446e536a51de779be210 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07bbc8b769c8f1720b7667c0f133b6e1c035858c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98188cfc0aa0b12bcbb71a1115928a20f6e4caf71668f0b525f7481ae549979 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf730d408d7a8843bbf8e784cc138eeacc8c840 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a29c61c9ef88b2aed08cd968380e5b9226fafeb3fed182c03faa038f81a7401 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..060150dd01648d726d7895e34fff261ef038761b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db5cf54ccacbdcdd5d6706515a37d6d859e2684431522f695637d9c60beafeb3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd523e84e76ab09b2277e9ceedea1f58f1f3446 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bbce00bb1328f97ddafc91b45a5901a32ff810a1f72722d44c00f557611098 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dfdce75cba1256c6a5a25fa984f5226d4eee952 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f6eaefd61d5f01d0a3a874a4db0c47adb8bb18cadd68d4c4a750bd450aadd3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c30dbcbc3e3518c55d9d96ffaab7ddec7b358c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27dc6f6e24d5535059508186e7c2ba67aa32f9f53710ffe4a4a09be51251a25a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..955a5bed6e909b28306638822dc13ed27d70e336 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76dbbec74bbe593a1fa74b6b218c39160b607567879ba1379778aee621bb81ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fdd4a40df0bf0cdeade8c2df8484331f012e5ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f9662e5926641af6470b33cd9dbefe08f78954dde58852ce80af6326461d16 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6234613bd47340e2366ded9043d7773e63a93384 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d45970c29a29be4668768982093db4ddb0bece665b886414cb9c5c9308910d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e278f49ab380776aa6a5737bcc2533a1500525d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be67908a9c52f5f5051bcc212907ba4d1667c7010f565186dfe63347696ab7d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84621b83b12e206c7c1e58e30d9221ef46f268a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb01b02d2c19c191399a177cca54c965154e289a829574544b576a29d1eb781 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d4241946c5b0fb5dcfcf359d8d3f764a31636bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea680fd9e3fb667ecd46575110a84b0cf278dcf394c18a131dfeea3f03ff5f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..801a64617acc95b6755e2b9d7ca0da0b4dddf813 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b3014f1c3c79b73061ed19abcbe271d8f0773c4085baa40f99f78358edf13f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c700415715e82258032f00a2054891e251a5fd15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f585b572baacd8cc474151027d867e541d9bb7008412ab5aca0830adfb4f1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e23338cb5e0d735346734c06aa9760b2842018a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7601cb3034947749a7d73aefcf64f8684b70ec61a1bf3b1f789b03d88b108c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4bd69a6b50a28f4f770cf4275827af033782432 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64bdcd8fdae6cf8e8a20737a0fcf55aedb42b8b4d57474e476e3f07e1738ef5d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a56c3329cf08a5b3945e66a2e95935fe6c5a1c90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00dfef667507b926fc8f360632cc301027916fc1b444981ba62ad4ffad860ce4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41cba3459a6ff6693d15c808b49c0365898a907 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7013dc71e3fd3cf61ac6631ff11638bc08d71a5eb5f3b123df45950fdd20ec1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..803013f22e7916dc3e75472777c435c2b0191564 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a3675a1b7b75fa8efcc737cdc813e7de3ceab240ec74687dac7a8ccc961e8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7c6e1ecf0db05fd757d5b55a41d6e1df73462d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1f9bd3ef9a3ed50df40ba9c8cba82dcf410b48ed38b4fd4bf877316c86b1a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6725b46940e177648562e5c04e58e64e04632cd4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40e974430ba942ffb518e341be16dcaaa0306190c3bc65bcd0c87b95abad2c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c1176f47eefbf15d49603557700431522569618 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998a11ad0c8dd0eeee55d28c33a22bb67dbe8c2d88e3889ee1688332c4df9c8c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5405e9a320f9119b41e7dc6531212743e4c07259 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7526610c7519d14f3a1526847e5b2fb91d2310cc703b286329190969424416 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd030bab3c02efe2f29e2d5f507435f8a973b647 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f485d5520b00046596f92dd08beb9b92bd11c3641af67f1dc441ad084d2c8f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f992f757013fd8c869e79535590bd4e3a3d5772 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9dcf061f68e079894ddf9e1cccc61aa2eeeeaff5b178b8464a39ad28aed4ee4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6008ecfbff9fe06a723e401b7ad41e5a306ee9ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b6fa333299903058b14d6d97662e22fe7d4bb3d097444208ca6daaea3619fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49a4b2e1acd0838ef91ce034a0bb5d76d8759f74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b9cf0f5316210fec483c6f0047c140101f8d807bdd09c2a05af4cce33e7dda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bef473002272b7f6a88c4ae1eb055f14dc4fb62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4154fee8e428b22f12b435a90fa9c8443fd557cf587ae29f28c40a70f23ae482 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..030fbc935fa9979688c92855605b8a7291a1af6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4bf8daba62e1b7a28eb0bafc12e4fb267451482cefae6ebe16ae8b4d1c3fde +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3403e8c80b73254641528545bcf8cc4217d95af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:858e722da681541f9d80ebb339c95c6588589659e074ce5007d5ccb2fb077fac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d68e3af156df8d0b86a5bf90f5586568c10f28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf1ae867ff158d3a6dd7b2862c54f3a4a24df3b2a1f9f16ce1c45ec0862fcaa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e84d9b1be123fa94b1a4fb6825f13faa5dafb0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2c98db1d712ec83d3b7d3a803809c54a85ebb09b4b0992d54c1b39c23afe99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7cb50922050c2441d4697879dc18cf4723ebe0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d532884b452bcc94c710139aaa47a254e996f2cc4cb3f12088c0fcaa4b30dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8127dddba009f5a69001d8ee691ae4461f4f33b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f40638c69cdae845bf263a489413328c5e590941e73a2f58a619a265e0496a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25a30771df8bbed062c7f0a32fe2e4c1e3c766cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4e1298267158c1ccdc8409e79849c73a8e8434e05d7ce396143ca4d59cc461 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cffb5719f24356ec4cd582075dd2d4aa3cf2582c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:715106f1fda58d2bdabd5b3374972f742efe0fdc1fb27c0a75a163aaf8dd509f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da47e96b136e5f946e7cd48c2fd4393f9c085f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0689a81bcd006103b995a0018a219e5aa553df9b7010f2ea916235258d6faa2a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c993cfde5c65fba879863378e0fea9d6d1008b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd9dfdf058c4b08d625f640c81168fc1b8ff4ecf8a9531e8cb2390070628392 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96d5b9959e72dccf5c3045dc8325916cbeb087c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986e727a9feebb52df451535a258d10f7434605012ac4040d79bcd1fc41acd8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab6ad547ee2cca1cc8a269e91ff9a167b6c7be40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4449321a346d91076937ee548a411285e81a80df610046ab9c27761353b2e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ebd32cb71577706dc756f43cc713c48748d0d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0b82f14003634979eacea3a09fcc7d4951003001014de8df49ec4476ac0e38 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0038c5f1aa45384b9ee3ab4ed6e6efb48bd6374 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae39c9931df22c5640106e6284f64a2f65a833b87dc2f160be4318cda78461a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..381607d5622bd272180cfd87b3c2cb41edab5d17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8c98c462303f45f0f94371c87582366fe655819c9f2c314be4ae43a6b4480b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53702f3a12f12e3f0bcca242f0c853dcca029e77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b457cf88b2717fa71dba78323f40ec46cd19cd5893a86131f78c4af0d1a8f4d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eebe10065d39b7f1bb0c2d994f2ae3b527a6c97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d122fa88a0320789c13d10d63fa123e133941d811727b4d376ac0ea536827d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec25faa0127101249ccdf0c16cff72002bdb7aa1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5029e81c0abf7fd082aea9e1dbe4b23edd55fe3a9f9a5814225aeddf376729b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d7939b67599a31acc39421be724e000a44d9c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:129e18d1de03b8fc214fdc6698fb4055d6672042a34535813a52ed843c1f6ce9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9638ca0c89b0f4edc372cc955344f6bbe18d70be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1c41c04488c7955476522341d73fb0e182fa819dc69701e6015a5737c0a4a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..295f126b9acd5df01da55d8f8465dfbf51466432 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39517f8441daf4248257b4d15d02a61217bc3a35b1345b16844a39a7a48e2792 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d156b3f11d8ff6d642ad67ca9ab74cfb06e5aca0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42aa66b2a2aaade8984738f5b634aec793a0848d65c969a30d05feb9bbcc3be0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0262765fb796570d88d31b5761445c9140e5b991 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2425a84cfd62fb026bb508746b6694e408eecdf13b7e585a404523515cee172f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc15063024e92ec77d843b130e302fca731f589 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0a7a71dfe4a984769d2f5adeced7b9ba7b8921b7bd80b78d47988fec7235ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bce86187354802344e11cbf07f780c08d96ddef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2830c1de55b2b2a8417f0cdeaf30452db80799daa7b6e96f30ff504c0faf38 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fd75567d71e1d6a2dbcd154da215654e09517e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a376eac0ebc54c33fa23b657eb9e41dc1337c9b368d5a3aa2fa1a7b206ba5e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f1330a1fa9f2e701f686d27b44628f7da3d0f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2efa6173e08899a726517e774b1848b16c302b867bbf8c4e1f2beb470ca6e1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aab398f4a7795948629e83b4661c896712d957b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b920be3066b7d4376ecd6d23fa33fcb289a2b18cca187ee508211b10b3a6446 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..336fbe0958664ffcabbbc0f0d5fdcba65425953d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ab2f267cf946b52511b15d555406495883e02d88fbbb88baed22dba452b7db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b557c6b80354126a0db4f8b104be044c0c3d5997 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b929550ef51d9eda486526fdaf32849a1efde64cf592d892b38d351a1d39acc0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b20d26324e1737a64ab8154262452afca913f614 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d987af62a0234c4fe512f0e1d29451528d3d97e9f6aaae76f6d5bc87d8313f65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..895e13f58b194c2ed4dc1122091d1f2825a26153 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d045b6c89e9a3fb5d1343295ad1cd9d2c1984f53fdcfda34affef72e703864e1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ae2ca2c7b2f2bf49e2390c1710df3a53123f7c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89f31d8209b5373160f2ba125e09c73c788d7cf6f907c558521bf0554419245 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d62dc04bf65ece3cc5d2390177507782f4a336e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:302316eda5fe4bccf03c861592bad447006f0c92ec7e1f067377ae14ed604fc8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efd893acf130698e53f1feacc5427968e5d1b405 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984cea848ac3083acc12fbc34b36e1259c7d711717f6abaa9a881b7d16a2d3c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a616fa57726284fee6202b8f3cc2cf8afe64bce4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d671ee29a4b4ed20db741f8d686896964070f4135ee0fc8622b45fc5517922d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a74199dcf7c67981871c7756670bf7a786022e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34c857e4fc64f117597982c3996efdc6931e387a8adf2e0dbcacfd6ebfe4390 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6659855950449b75af9f902c3f0b8f987cc4439c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b40364999c9a5308687681da74f311dfc05f4210591ca9260b7b47538de4aa6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..172a0a675dfe4d7a9184f808903793aa4154f5ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043686915888dc35494eda95807a00adf72faaa8fc17ad8e50487e89c8fe27f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8d9a94da89663358f9dbea011ed2342a41f4d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba015c6215b234e476ae974fbb956c95dc1f0ab851df8dcbe495f119c6dba87e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23722e0112cf775902de5102280aa2201f1e2543 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f326cfb2c1a42e5f6bb3bd8d969c8d4cc55b891b8bd3bb1ff8670eaa0801471c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bce2126a19fb457185c07edbe16becddeb86cc6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41af31fbfaf835ecc5cc50ea61e57be0f562ad2d6ab86e3b7fb98f2b92db91bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4ac62b917d17c4c52256e7c4d6abec240df2bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6128e6f2112dc5af85fd8da94230833fd2fba68015a91a79aef84d9062e12bc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de11387f2ff3bccc6b5d49ab16f1f93f73cdfbcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fb31a1b679623e0c14c3b4b13e10d15f583ef07dcda0de6b2b84c17cdff99b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25be58c0f72f9704cb4ea43d3d69b0f2a30a1fc4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf8b8ee0ba4a8ce755b0ab3f4b32c135ad86887935f29b6b43f43c58efd770e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1640f4e0281d00e7b6292181febc51ee303c26f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb99396bd1400d459110399a93b22eadc170e09258969ea06d55f407e4d4b22 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c64ef533b82398e1a11c935a66a862ba0774ca0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c36f550939fd8cc532f800811c71f4ad379e6ebd1a5bf46db6fdc43cfb72f60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01b39ad25d63f0422e33ec76868adae701f10717 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fbfb98853eb5f4cb8dc653cc6b9070ee8d51d75046af54b4602c32665c8b84f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c392d9fb0e7e1bba41e892e13ca31ea46ab27b46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca15010d1165d859ab2091684c149c5ef34eb8422a39a6d20a2e5247d44d523 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..721ad2da13549f656e71789a2cea33009eac46cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e159ceea8cdf94a4fcbeae5271d0485da8de4326eb634724b4fb8a140a57f9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bccf38402b0b4a58f56feb37da93a6a6d9a3d42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f202349d3cfdadd02ad0192430a314b669bdc5a80242c1a5773e0b01391c3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c9e7f849fcc49692b3196f7f6864e7d08c76ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f209cbaaf7aa81ff4f7f1c022d06fafe1ad43770edcdfe026290a2ef6fd3659a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc2d2677f27c6223ee1dcf8a0ee03eb95ff94d72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c9b6e7678e9f2fadba3b7b83f2576d187e171769484d62e8bc3e42056a381f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d440ffcf253652f6b477592e1080f4561027757 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e91c2a5c027a49ecb1bf63b72e4b48bdd979d2b880c0edbfeade1bbbd21c51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f88d9fc755c45f06403481f59edae4ac2d1f9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccaf34dc89c9c405b42632dca73b2c9423e188c587a86eec2c7f1f46da7fd8f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7030cddf5cf9f4ac759df3fe6c40fdfc9efcef04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0df8b48d65b0a1fdf0a8fbcb00b57f594bee604f0158e88f87bf938ff38f34 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f73ff54b13ce8b3002ba4dc51bf37723e8130f90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b10f70c1a4836b02ec5696335f060746d0e98530810721e3785201f25ca26c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8206f570a202c2475796108d811d0a527f30d786 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d066805e25d366933faa8bbbc9d9a99a7e6ab1a6d7353299ee28c499aeb4792 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec630881fec5e694f6611d7e2428fef3407aca1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d80fa5bfb00f90b6aff8c12018799bb0f30dbad95a092cfbf5ff15fcead9eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ba926bb8c8166bd7f84a0820a8dc989ef1947d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:880342a57cfa3a4e46762f13892c65509456e96451e9f736055f6a53c90c9978 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57618c4bb6890ec089128e120253bd3d106f056f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5164b06a15b3bc505922736becbd0113c39256bd6d426cd9c28fda635bdb2dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a4c0b547050b209b2ad4d4b91be31ba92243fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce312de68b9d28dcc89f87888501ed1b135c31e53ddee535aae0470d73d50ae9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f78db5082aa99dafb5c4cb711ab6787b813bfde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8ce98f3946b5ceafcab93180614856e2d191c412172692b4a96bddb9a79d02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f2356f2b4bc8b9dfab6665cda6a1b14271499c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eb07eb3ea3283696be378af07fafeae8a760103a872aa2697f1e6790d0d936 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07508beb33f38eb820981e4c9eccc17e295546a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b2b3da9b4b6e3cf3775b26c65a8a74c83fbc8e43be58b2bc5d8929a93613d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9df298f1cb3d9912f2d00dfd07abf35357cf545 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f40430b4ec190035fcc836a47356f442302581e33b0cec57cb6d4917bc88a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f112f58a326cd40bcbc7bdb99104fb3200c819b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88165fdd32f7eda54baa0d8ab5d494d38f1eee7fc75657ee8ed3c61cb1a07f80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc36f2e56e206e8adec5ac6156549d64999640f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:037821e3f5edc8708a9718cfc2551587a1503c09bdd553c8d8117f6c7ebb59e6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c0000c48710630a52d93dfd5afea9fe1ab4071 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6caad7db4ee2d4802184d8dd7192e61e672a8e9b6a1f5261e2c2a9c87bfc2a6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fcb8b97c240a82d5b16867fdc0c8f8969c12a50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2d407e5510e091586d38b0377e069b32e3d0a936b8e676f594238db396f43c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10f6b4ecf5de18e870d0c78ec19fd3dc7b0b000f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1581c729dadf71afe03f4e897b78b053e3d93759f5911832782841d72e8f64f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..717386c311b3625b0440ab53f6f85b299adcd6d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc844bb48777cfb2eecd673a02b589b553aaa19ac7dd00bc559b952a22daf0a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2daa2a2615f77c18267b7633655dee734fd6bbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f414094e4ed76f101775c6f52afbd68f388191877036ede96d47cb662ae012d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9173c9bee79636eb0162a3cd15bb7eb93f88b10d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb079250ca2cba0e3fb08a52422d825bc395a98c12d2c973061c8fa4096a74d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..357cef7ee0772dfdcdcf568b853da3bed7af3db5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a67bddd724d6429ba08874739e540d0a49d1cac43499a9342463434a0d909f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e155fbbea0367ff0d01f9a9665876497850c5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11db1b3bba5c49c44361f5fe3970e3e821e58998589055ce7881ce52b00e87f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c4a2f571481cf5adf5c541d93e7d9878fe4117 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:802c9c8c5d5084d361ed4eebbb2be52166d012c0832a30e52677d197f5f40432 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e43bd0de329b4d2920377761c54b16faefe535 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7156268ebc45c07a69b2fb326d5faa8aa60a803f1bac583b5de3f64275cffe3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec3bdcf7da113435f6fe548c7e986802f86c68f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a41e1be50bd645ca9476bb013d4ee991b815f63a16b4b0004ffd62c4189eb11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7debbb4916cb5a7ec706a83d394864f098087e53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6db1675eda2c0f4096ca58e8a6ff7c24da893d1fe0923958a5f35617e416c3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c2649f72d1977961e2746f84e477ad837c8c1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f676613a3ce55ed8290ca68320fdbeede09b8ff4911d6465aac691f41845bbb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e946d23ef3c9f338ff7c363f254f2fd0ee5d3a56 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3131db316a6086a32833f8f0e228ef9c1ed2f7084e79f75d14d9bd73aa2132 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..235ac838b872ce3efcd1ac80b77fec6f9a47108d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d479fe22a24fbd05e7feaf742d09c1ccf3fa2450cf615e8a0eb9d526a7e8e09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56ea646f3c4d4142bcd0592deec27e5b2104f6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fcd7ac45ea987e832bef6c0db1f408b27a15463d997f06dc8431ac8009a4357 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de47ec484630029df22dd21b9b50171968a9c1dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e614b9720537e5f53ba7323583de5ff6d1eeaddf3d6256cf82fb72dc09499a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73486043e202fe47ad373ca1b8e4f8d74bb7fafc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11fe2466e759405ee35260075b8bc3730b7109e67d682607245d45f96a7527c9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc1b8831c7b4e19f0ffe7c4830d0017b8df2339a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663032ce95d2fe4019d15a923ce264949e9d37d22eaaa5b9234ec62366e78a47 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d6c61dbec17fb0ba9b7bbeb0faf198fc5d1713 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9e85bbbb4e5530065f74abbeadb35b98f5daccb1915e71483a284dd466ccb9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3458cae55511d81d014176520c489d12c41fb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f6ad0071f6b20c2272d7da508887b0e381ee09c41c8301bb759a2d9bdaa380 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16a84e8acddc9145748f3ec3ac95acf31cc074e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:715afaa0c9f6fc18e594055846dca4cbd7ec3bd9938554de075d0acd90e822a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2252c2efadf06a13c9fc66057b8643c155f41d2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468bcc83c67afe67ea4b6283a1c39deefd03f635ec8c9d23f811d90ee8e5d229 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e2a8576fa82533cc38be172d89295f949cdeff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3668ef0924b09d7077f44cbad25d29c1f62fb73b99d85e8c727617a54a3f77 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2261cae9efe9ac0242d871dbfa1bc5553310e96c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6107ce03ec64ec57020a0d187047704a354a9fe964b77240874bafe9bcabc5a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4b7f138271a711ab4cd5a1880aff529f26f4c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc71c4752ff2e591668fa17ef247342d66280bc3b1709d906a08859c64f95422 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d70f85193ee4b612e7f47d0f0987c65417c11d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7decdcc1a3929d3c87be708db9407e034a03169e663091f3f9f1e15d8d21fcb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7533f58cb27ed14c832f087df187cf987e4561 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18470a079a52c4498ddaf6ddbd8af99647005732d592295e56e85026fb7a4079 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9421c4d3a314a9af8cadea90742f3a047fa3810 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a51be816882caa1719b594a16e41d63253503dcbed81652b335c307e4f9c0628 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ef1a979b27d4014f642ff9b04fb3138116c9f4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a955348dfd65f0c888020c27cba06340ed28df8cded080ba399053a629ba3e7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b913a4e54ab6d8d55987b6b51e1227bd1a098437 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080c4e3a1a5651d3144cffd1fe878dbec3c915a17e5ffa2eee5cb8995730f042 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ee85a1c9c6314b55586456a68470cc4364af51e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27aeda5739b5b9ed07536787bd952ac66f079b4a44e2235ba7a18a554a7cdf00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..096d82e4a4fd14d07775065dc4ab528f813ba472 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e5d09a8dbe1e3f3142f2c5396ebb7aa1cadfa052c42f3286401ce3c3a439ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29023eab5734809e58721ff6dacb55fc9c2c37d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777a0290abbabc3b0cb3f6f6eafb3de71a26b73410504ec9f3e4a1f4a0d94272 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a879c7cde4488da5ac5e7b5bcd96226443233c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79557aa0f7f67f3c5ab25698f590d1973d3fc9864bc2e11b36dfa3b1f729aca4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..329da51cd868f477c3950691be51a625279d68d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f9737c68d25eeeaec8c527cc27bda784d1fbaeb9abc8b08c32a2106926f971 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b7e28f4a25023dd759a2335309e080083b681db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b3b1061125a80ca12a32905a096af28d0bf80532469cf36f5e6f3c4102bff4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..becc2af50a520c1367077d017bbc477c02df356d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4dab64f9e73ab4f9b0881289b77f9035264735acbed1a23f86318f6798d16f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6bcc462d2bb3ad1bd56bc3eee57612ebc318470 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331af1b8bfb21a117d88d68f25124ff3175d3b7898657a16625a12e5960c4bf6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6494a437c83c0fe6bee4e3777c1579360da86321 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a71bcee6b3987ad8f708338f806574440346de4a9a81cb36ec7629643000c3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4150ad1f89d21367f4cd836fd4337446e7fb76c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eeb191b77214adb6595d10c423b7ba8483015a53c3e0505900dda417ccd5ff0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4afe753a623fb316edae4ccedfd6939428464ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d7e4be727c05f6ebd9bea36fd3096f13446ce1e6d2902ba0788832666aa476 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c79174394a8bc784c754fdea3b0a475cfb3b7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc41645842172ab54564981e2502e18c8c30b0adab13d4e96af6323c29aaaf7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f69c40c49ca158caafb302d8f07324cac9adc1c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cded3f0452392ba73db295d7e5ec7c2bd8c2c448a8bd51b76bd94b96fd1f2bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab393b44a57f38b6461afa9149a4d39c9452314 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7939018923a55283856e7c0c6aa3ebba44c23fa6342d58d676f129d2b994983c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd6690c7c38206c7f619fafefe4ee5ffe6087c8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b9a48d64c7888e67401d5bb2543203c0832b398078432de0ff6cd19e3764f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8208f8d4b794d48588eff911d6d5c01caecd73d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da406b71cc07a5c47ff1e1200951280ba668c287fe8ce17e0e865bc45ac1a2a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e790945371d6e6f770ac319242827bc269adf6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43264294612ba4e3ecd664584389f7bc7564382928f7fdd5eefb06bce73a9547 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14652a61e5cff38c825114de3743c6b9a1a4ae10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49a7a7359c4a65698c95e5b8dd9e819bd92515d2187fee9ac69af002d287d3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56396dd91adf919842b1bdee77170f9253166fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4daaf78d530de4c51fb0c4be4ced8c926320ddad1ca2c7220539a0b46e7ca2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cda881f89c6db990191561a478b60a1a7f41323 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee321bfd07991a0df2920746c204ed450292da317b560228e22ac1dc349eb30 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab0f43e3f1a6c59c8efe7e83d001ad849767d49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ace90c05e86271a0d6dde359008c6e2660aded558a2d65fb5d380ce83cd75ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d05a03e3809f59c73a96cc0b515b188b556d4d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911bbd71b73f5b16e3dca11b41fca5bf4cdf097aac79e46859ce0a7268ea16d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5364ef276329a37e54f54f62eb5216f2135e145c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34eeb037f2c62e1fefcf07f963a6f737f9e27a217917fde0682d9fcb184505bc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c465ea814d3126f86744d1cf4300bb158869109d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed33216bad95394013888de900e2c782ce2ee299b4782f3af937eadca707373a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbbf2d3ea86089913e462689172f285b1564b088 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcefd2543cc76e398b7b6d5f7f9e9f2b9288919667e67c93e6686d727d033a58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a532665a49aa0ece2f87a42f59baee5fba3898d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6a1061ddbd6bcd95910a88d5ff464b71b3e1fe3705c100bb5d3f8a4245fbeb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb15b4182f0f421d981d6357de6fc553d41686f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01464a45ee8533939d7eb655455f8ea5679f9dccd402565bcc6ab4c8e8f9db48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77a564f4da352bc4e98de0dcf373e3a72af227a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc310525f51c886d2da505b7e1e4b9896346b74f2842efca04da62869e5b009d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2efeb60bf090cfa2e53596b01e6f5e910a697811 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349ad50234ff98f9199db6df0d88841c9bba60458bb85a381ea9fdee405bbefc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bec34e33fcc084d445651ba08e9fceb1448b9ac5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c72eae6e8ff4bb116d7b9c54dc0ac356d4fdf555f40b1e42784dea4e63e59e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b19e78aae1139315151d0db9621088e4ac41811 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91419a8bec956123c73d4ddd586fc691178bab61dc8ce284c877934f34e0abb6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f1a3586a0f779afcb545c93a0939f4ba2fea81f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae490281a520b20ed5dcf45e0d74cc5e564cd9b75c3341140133128e71a7c377 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e481bf34e8e29add84c60e019ef4afe9deaa7c57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcbaca68453729b7ad54e20f18e9d0f67fb509356839b0272ba84c4123defea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1654d08b16441340920c949f9f4ca9aa7c2b740f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6590d5257dc00055c22e18106968d1521f5ea3909ece1166cc292b90d1c68378 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91cb881bed9dbba887dd14d65c59fb56efb9842f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f36fa08152a6af8ce74629fa60c2b6cd690365b66390050100131806bc9606 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d1210a08bbe7184701867bf07d8eedb05410c52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6774a1263a0a313111206f601de6682002cb4455ea6386f90c480e663885b03a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b1f436b869738746db12aaaeab945d9b86817d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aecca556b49b26a1f1381a37385a87fed00a37c3f662981d12dd258ca5607fd5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d53789616ed22663b0ff1f9dba6f264b9381bf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118a2f98916b9e1cf40deff202fa20ca0f4433464b121f81b7ab98a561f696e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c751de64335b16fb6cadd39805b99b0bb5fcf7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d373dadd783f71aa628049a8213ff60b5f6943d176309e6d4b0a3acc243c291 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..668f15490ea78d8338fffbfb5ee5151653b75470 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d570fbf65eda3f917748e96521f03341d9186a88902490fa575b9eee460b476 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e420f8bc743516d0ec1dda23ab4bdec88bc31ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea03cbc6d0f385a72b3754d97ca6c169e611ee495e9a7e3f9cedd2cccd00027 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbbf11273a3b589c7547a5c293f52d28205875c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e628ce2c0ac8a26116d2db1076db94aa1194fcac20d55f91d8cc447f13ae1b43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81e08a468539d9c377dc00618ef33fe12de404f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7b9c4d39dad178f32aacf60fe7171b28472c6441e4846010fd431d3bbc4091 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08292b4fb80f6fa1ba0284a69250b7c61cba3732 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4924a92157acb085c09979fc815668c97086cb16f7ff04e0cf0d6027ccfd42d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..740e289216277f1078945a5411bcbcbb851c6844 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497bd89836250dbe6e88759acd58e336bedb51306bba5145954bd1ddba5b40f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d68d076c72f44c4bb94d7dbe3b719eee0e29d64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3783e3986318942fe23fb184ce308190e7506e9443722dc7fee463dbdae2dd4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cda4b617d56da6d798e4071fe8c972bd3bd82d5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be604caf0bc1e8b30d7494109430e92b52b9079e6671029c1605fb7fe4f1ef93 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeceea57db952ddd4da0af561af60f10d78d312c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1596b0d6b2c497ef39c196ef03d7967c507b0027a65aafa1ff231c4bdf449c48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e0cc52581516c1ef217bf1843769ee895ad8a16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743d963ca666d8d3aad2a02c9e670cafe5b5e75b61d18eb2dffb8181f0712245 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4824af1866a50efe158f656c4b6e2077504b2954 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114dcbbc4aaa45684452b97fc7613e73efd76debe4265fd790993956b16c6da1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db5f6c5f66f6c7fd3a1b7fca95fa4364fc523856 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4f99a3f364fce3d2c23ac106e042b430b58ef2d43807a2a7eeb74eb2e3f37b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c0aff71bfa7713a64779aff406beb91c06619ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b75c54ddbbda1c29d0b7f77b97175f27820ec851e75e7a3c213c37655646e51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8030c0c6e218d7b9cfe59d8111ce1477ad17f377 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecfc1713653559f7ea50867e9d33499695e19b0ae07e5e9766e4ae5537bad9a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7715fbc4413a98330822e64d9a9ab0660d025703 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d1d2cb540333ed1a825f292c15c3f924da6625d10bf6128a996abcdb0eaca5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f3cf5ae6c6ab9aeefca0582c2f1b5a347b3f4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57285b47a77bbb83706f9729390093ba2600bee32a1ee3cea493fcaa85a69075 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3cc46839a2880965065cc0defe3df08bd57e754 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77aaa797098b71811f994a2f1e7c0565bc2916005c840e49dbfcaf797dfb2a17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f237b7835e996bf9c9b09c43d7b9405c616cbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f3c60258004a70e1ac6f414faca497b6960ac31d652e9d4812fce8f1a2d884 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4473abd9ad76872064092306758ad7780bfe6560 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07118840c9e085a30e212649f5dce317f30a7829c5a634ad93383b3910f28b07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a887f53e0116bc829fe655d6e31d10408eede465 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52977e6a7c655596361f5fe55eed8afe18cfbad8758387849ead03facba80db1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c12846d8506dde417f136554f997ba6669b14906 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78754ebe4e699a5bdb2e26fbfd5e05e83ed694a5562a457bdaf2b814800f7977 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..609dae3f1b48d22fdd99c4172473bbc4fbf46991 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec1181d348ae13428324c9a8f2065f74d3152883b9a421c7694bcad6a807975 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b692145b56a84bfa2167e5507236274ab377dce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf718143a6bd8b9d85216854b77b59dd66cbda8f4bd495812c5e6a748a4a40d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a46149c2961efd2156d039eb781d7176184fb9ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998d2516f6657c01c2c9a72ecabd9c642b861a666a55b12cea502ab704d7ba4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..597ccde4242be133239c40b2bf51962f7fd43578 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3beb88a61cc8e0b5463154e43f563a2f5e3a826fbae82b3fb5d68d9e16f3d5c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50d8aabbeee37e74fe0c4df0a9b3c4c496cf37d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2618f32fa71f421a2093a86c43f307eb722c4d7095181bd3c2a1c9651c6f702 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ddbe3ea7f0fda5fe26c87ab59e0cba8da5ff1e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1496a3dc2d186ff9b4a42c34780e1172d46aff73c1a80fa27b5bc72e5bd63725 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa428b725e4c864ff3f486a886baa099a86cbf70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929aaae910c7cbbf08086bfcc49f3b18c474a21bf77df2c30ef0cd840a25b277 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a1916161c8d99ed9a1d3cde20db040aa1f7e36d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482646bf04572ef77b3a66a5c45540d87ba575ba10a8ce873c55ebdd6bb0339d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e867edd22af4ceda9b3bed3c7096fadbbb7d6735 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2d0800bb5c6c52f71431a6e04a1c52a95cf992ddf07ac98e31c9017a406dc0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d39cda856acfefcf62180c9b0bc9ea1462e297 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816fd71d03b3c3b0f07a87623179f9775e73211eafa20bb98e05ac716bc8129f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1c9b0541a8b8891c4ee4a1c06aee95df834a575 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1979a992ca185df696545be2a77aea1c7c555e8efbe96fcd145e6f3d453adae +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e70a092c8047ba001bbbb64cc0081829515f4a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ef8b0221f6fafe30803a3005b87d9c6755372994c93067512f0c3914123c86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..972a649dd8694c25cd2147fee4a002f727e92326 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1323315edb4a2c49e7ef9de7f8c3f1461387bb64db4f98891a5e81f6cb39f84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84eb4a503f6394472ff73bb8a9e153a097d8275c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fdc95eefd7033a7884fe2a3c2e4afe88100477e2cef1306a311a740a79838db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03a288b41b3a3d4e91efe4ab81699ee772727d4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ffd4d91049f99bac1b7bcd9fa42f92ae2e040d6a63af7cd9da8d44d87b193e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee743428c2a03ffb1fc51532787d87ddd650a9eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e36e4a56211c4110e2fe0e98f1426154251e0e2c9212190ca46c32dfb12a015 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6700a680ccf5dbecd66f731120ca98887ceae38b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75eceeb05f7979f6f1214390dd01cd42445df6e96b4709a4961d9aab9319fdc1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66aad300bd660e3e1d871246d69dc24c6c4ab616 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71ee89197892dd83b8eef0a9312a1618221ed390525554ddba8dd906490ea96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e3d3c2a516a418e8412a3c3bf78b1dc4963c591 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66da3251033cac64495c9369a4f660f16d5d9d37b3b94bf33073ffca5b85fdf6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3259088f5571aa87d85a73ac6c974c041d263a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82a289e8dfbdc1e9e0edc46d4d96bd16872ac6dfa4de5e992e818e64b11247f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38563d66dd984daf11a19a6c121fcac1e1769539 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a53095890afbd3e2901ad23d23a4188ba6c2617d5877738eaf31b6846a6c20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40bf806a1de8ce8abc4544def13e6920b946045b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d66bbfa57e211909333f429c65b1819819c7b1e00bd6add0b1c61e994a6b92c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ab8773eac1082435203f2d4a6ec8df84e1bbfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9aa42600c323d01509949aee06e11cabe049725a377370e7071959bb91a2229 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cfc4e266209b91e2b67c563f7bd788450ddc80b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68d4508e838ca49e97b8b0bb353445484f12ceac4b2a709638dac171a9b9bb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31f397811bfdecef2bbe5275c270cd987c5fc98c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af7a08c34b7053da33d0e05ee608a0024858fe06a43b95dd04ed5a171069bae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83415235938e6cf58c2e63a21511b7dca21c2c59 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fbc6e5f3bfba3374aa6b5f03c2a5f4e60a5507480a493ea0ec40968b1bb0cd3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ea6d223263ebda2ec5a64766b2e284bff84100 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419a4e8d52e208e49a42f8c577af027d0708c37014d135f62e4dc20db3f1793c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b848bb7b68c2fb9cebe657f48beef47cc0d8b8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953578f1b2bd624a36756e27f3ee8416d229e3f980859398d3691dfb079e5f3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2c6447e5861388305e035dff1fe040c22f18cd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b531b4ddf7de5330d914a28cd6f25b349c8acc3f6fb77c980390ea54579d8dae +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe619e27b480a738333ca7d0ea03f5f8d7f76f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d408329ad2f0262883ad734d332755128219228074db84af19bafc6ab854dd16 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36d41bff228a92f35fcd596c85801d5fadea5384 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d95b7e9bf20f88b9135e35ce7b481d19e519c7201318eadccb9d7204b20281 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79cd6fdab778438756ad31a0fc15f80073ad0e92 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e414beed0148c6a7f9213859a291f0bc7dc90529798a348278bcbe5e6f6a5c43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f0e02c29b731db0845e5259dcf9b472c262f236 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a5e8cdabb40a3fa21b542acdfdfc7fdca951b118802d2411607a4b13b06e89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c59b440ccad4f3011264af1dc9b38cce9ea14cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d05a6c25bf7fde3cb6a7b1635cceaa14b15a8c3235c4ab026396a312ccf4746 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f32ddd95ce0562404fa751f2e061212cda2edb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c1144175461b4e59da20e4311dded193cea9b0935a5951d031a128ee4252f9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3e8aa130445a578165b0d29b416d712bd089d08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9950da8490d8caae1a3336a8ec013ce9ab9f340593a1ea1117b1baf5ad960e57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1117fa067bc25b2b1aa87af470e2be24d092286 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d733d56250307fd62159e5e704bcf263af66078bc92027e2c31acd0a0785b3d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eebd7d4ca8f219a9d435416e539be42511d408e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73109f95d2628b79abc3d498000b8f196bcf6c606d3cad97fc691821348a04e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c0b7c3f247cf336ffadb75039472e179ca92294 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9341eff32e788e300fe42f39f9e3d1d099ff0946de56f74e5c873162d0c65c52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c73347d9085c9e326e7a0e6ae7a3e231a5a3160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4c43caa28f8928e88b85752e00b22728e2aa29f8972e349f104817b6a534ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c007bfa7afd435650d84d444e99ff090e9aa30b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11af002ba867d34e029188b3770623ab617f9fb9191ed104c5e96939e3635cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd2343dc264e870c168d0ef6a19bc9b3bae998b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88e05f4b8ae460a691f5a530eff527d17e287ac9b115e46b2ad87f759111046 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..adade055f63574bb31af0c59cb1a40a716ed2304 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aba89f449e51a94e6b0289ad329e6feeb8932351dc82f19398ad575a0dd1a55 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab067f0562ca0500400248f21f84ccc5229061c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df72b20f54e587d3feed26b5defce14bd8aeff7839fa89830b6e9550a260755 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32bd206cbc8b93fcebf6894d44facf6917edfb05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d76b0e9613585898b5253ef7513c63a8c70441a30ebf913c97dd1029ab6e29 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bd8e874fa6785f351482002f5a0da9b3affa60f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780e8e8acf1a6ec24de0dc8ee1e0fa90d8711e7668e1047989282f1230ad8d95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a21f7e85225538f8b7cce152dff1bbad9ae0d08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2193a1556577bc3ae5c1c664d17e9e0858bfeaf5314b4f8e5c1114da85f7d083 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c44aa173f0e94906a90abfd900c8f91182cf7eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92cb655c2972e9746c2c5d782dda31df085aaed546d992296d14053532e740a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bf2f5a639096e5e58bd531d1dce89cd84f41cfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e3c733fa863943d724b40283e89ad420c28b115cf4a6a3d0ab39431a9e5598a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c621051e6ec3c774579a2ed8cee1e15ad7e9d124 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2da115ad28cd23dfcb34dfd7b083a5c2d66e113bd9d0dbd0de646f82284a33 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3fddb82a8b3d37e03afccfa7d4c7db135e4f2a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af6ee028c41cd1151ae5f92f83631f0124cad9f02fede6981bc9fbe3d07e49a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eff60299284dd73a7b8039db5a80e2b725bdace --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3240adc316b6c668d22af0dcad57a9af0590fc3e27c84848fac0375af1935782 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54b56fe7526b41bc2be3658c1d8ffa6a9d5d0bad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f016ae1f7142bfc400bd9258377d61e637dcd09ed2a3eba544f0dfb7bd8154c4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2336c38938d4f30d6320c93ce1f8623bc5e9a1c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf255d1840bf60254ac685f0f55d63f9fa511eba37265b45070b5e18a511dca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d9885d2e061abe408d0a1e31b2ee41552fd7200 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b602e7510bccbe46b51ebaf823b0ac611f0f94f15e3c1e2c902fc3f8451463 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a967242acd767a27be2b711a7f171499a11aba8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b5f3f7c05eebc9726d04128a27c47deac96c25380c88b7598709c5abc985b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..380dec4a05cebf5404c0c23c44a2b9b9fd772692 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c420cd4f72b5856d237a6038c624f6c2b2960dadd8a5119aad587990679d0c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5ea83a072d7ece35268e24da5beff1f5e2cfa7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12ae9559c17383eed7f16be62c2d8f0bd64dacfc33db4c4382feaed7ffc1621 +size 11395