Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b087e7e2bc6dd436f2ab8f995c498e33dddd72798e9e7cd561d27252538adff9
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:978d5fe4c7e6db72667a8a849dcab3227809febdaeadd087b768dfc48b130854
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74e1526623c769a1149bb29bc8b26b02217529c1dbff64962955534f9bdb1646
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:936cb15561a76e0ccbd18b2b51e1a0b1162f0a271eb4c7191b6b1ae36065e2f5
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5476b9febeb4a6c02c2ddccbc8715221c65cede89a24b79d674ac8613ecef38e
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaee1a529490351ddc268f3e3739c1285bc1f40725500b63a311191c17c6b8de
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2efaf369759598188b2d27ad3ca9e8b91593deb21001167e743a4e5e59aef45
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba758f3e82f52a07ecc5082f2aaf154de1d4117bbf30d658697be2d98c2523f6
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fe50e8c3c8e49666a3467d0badd88a4f264563aa4ab72f6b9881b296fc305e3
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31119f23b991bbfff4b5076f304227938716159d6d160284c9ba9a8d9e0d7e80
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91eef6b3dee3adebe7c27deb47819e83aa2e7978d4971a886975dea32196fa98
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2689c25b92f3acbe58aa05c6d753b71086b93d749cfad683064a4bb81c43c6
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:601fc382b4fbf0f61753f6294eb4d7343060513974a6a49376a071acf2a3a3f2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67013a3a235b0b9e73a885982bfdcd0a0f4067b66277133d2f9c185f2de25f7a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faece96bed785f2ae7e47e0c83e1320045534eac970afbe5661f7f0e3ee2e390
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31188e68de624a57926b95e2f56cb2c47673adf6dd4673e8c9db337d401b9bf8
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:517ed040c7175cea619728ec7c8d89eedfc42765bd0f6a7cb29eaf0e97223aed
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6c8a1dfe13340cba7590cc1fbf7b59eb3d85a8a60dcc4baac9de9d1440d8cb7
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:630977a4947dc00056c271a1c9c7658ab5403586a5e384248c0bf0c007b4cfc1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b65ccd046990822d6772afd1d8c66c27f4806dec7d08303a644accad8e7d8fb0
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b711607cb02f3673887183cd35b21e5eca1b95734da908685954480beadc0d
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cd462035eaf9824122d4d6d97e6eafa351fd828ebd2caa2b77afb8143860f46
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e85dcab8dfd15ac3b2ef926384f7a6a287933f33500d0ed35220ffa7d4df88bf
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d02de1c32a6aa3346ad2c95421275bec56ee75e97b5dc3ed3679734522bbcd8
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18ee6d55e964301d4a148b5e029659d38661514dd1ee6a40c1609bbe5b63110b
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a50ffb18f42d595f0aeb781898054564a7f1c64bb7e6768fdc9d33546716587
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35ddf1cd289f53cfcb198e5dff61296a48d7591fa996a3084952924db5bf0141
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1
|
3 |
+
size 11395
|