Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51485fdd834ec63e996031ce16fc2da544bb5d1ecd5ab2b227af205859aabf6d
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbf702ae34ddf73874c1c829204d31439eb4375080e7efeae3eb5b930deecaa3
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8276e092eed6f22c5dcb8dd751284721b48c0388355a6a79d8d2de161e478f2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0eed194bcac6630ee4f2efe7edc966c6e150b8db4ac2ffed12cb78663be9db8
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e70994f35ec110776ceefceec2750ea5fd8f15f53e9b548caca307953c4f7132
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37ee967f3ac03f11b0b3d3d1e45fcc19e353c682c08241c32f409ce03651a073
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee3929ec1023b1a9ef82aa34228806934aba115f6fc3a45fb6a7afc191b96777
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ddc206e5d38a66246b315e02136cd78bf7cba78204233b9e13289dc766a12c6
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da36ea30db3629b87f007fa2b5e3425891b936071bb371ab6a452981024a6495
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f90f2d641ffbbd7626667a456476a291c4f9d6f51c024801d54d2adf2c37d14
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b8710183d376e4e861f1ee2f17ac5c0d6711466614e6370e3cf8efc12db0525
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdeb8619c9c4a9212d727f9c0eaed34ccb32739c13b2936c99c46990e72ae66c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d15d06190c26cc906e277c3fefefa30849564d4af99b1d9bcf8f7b8e094797c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5b26a5fa97df45a9f6d8c053be8d927b571d7792a6dbcf7421048f04c45759a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dcd9207067fc32cdc6e3998c555d9287395bd54e519c2cbc95ddf6a7542ba1a
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5b4b5f9c7450124398ad28307dc259c67c5070b2766e6c378cf6897f6f70dc9
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0da647c08e70a69c7cbb71c29210b22bee04ca1fb5c475404b012acfc454f135
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5aa8fdf09601e39659665b9c285e1b9c431d60936ba5018ee40ff8cadc71474
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b92b3de360c74d04be4ec7dd3f70c8321efe28680fb4e3d4d003c15601741bda
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:206fc3b99a0453e9d5dd81957617896bfce4407d17aeca33595f8dceb95667b7
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:993636e5eaaf8df06503b4286acfcb16a20e5ed30beb75c4e432e302b7b98bd4
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bf4db318fcdbd0605a42042459488def58bee224ae6b3a935dc0159de28f05f
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d20656788b8fa44afcb2501702b775b53aa9d0516dbbeaccee6d8bd8770edbb2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8ae3dc765858513db1a2e60fcb2fd19f7351a8a44a3b14485d79cc257dc3d3f
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4d647be3c28b4f760069595a2c2bc9f1ea8c612e103199287e796708a01f331
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cec95e4363bfe473cfa81906a76fdff8575f242e25fb1bc7adeb06f777af3e4
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efdb363078c957df94c9ede3462dea93483360959db371cfe23641d098165145
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cb64e770dc42e846c3d9c53346991fede52c4fc3378b84ccc91ac56eec72fd8
|
3 |
+
size 11395
|