Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6a7a96655e1866ca27e8083357ae1a7c48bf7c253cf08e272c0818a84dbbce2
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c7846bdcfe3a35e178fbb77b2deb9a1eca0442cb9fcf1fb0bbb549e8f1bbb2e
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5aeacabeea574f4cc3f09e9840ae2e801f7195777895ce9458311d17a2f4d933
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8d6573f42159a582883ec31bbd1e6e63018de370a0a0f315b9859ba881a90d2
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9839a80b252eed2841a82a2d17bdb08e2aff0691aa87669dcfc7123e5ed44224
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4d2ae9f9fec94b8bf9d6b825d16793d1a2767862654e663cdceed83833d1633
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8126beeb659ba5c91ea920bea1b66b714657120546f6a96195650c6245c0c0b
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:042db0cee25b99bd0ca0a683c30698ae3620272af8908e3ea986bf00e71161ee
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fd6e4eec46c55d8f57ab770a198a5654ed35ffe80007e9983b8b303a80cac80
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c19fa697f2b8a519a896ce70d4739e8a41a0187b5074170403f3c56cfdec25ac
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbb75d96ff2fbd4a4059d31044e4fe6eb0a897532d6d784ff8a05933470962ab
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d27c9ff58e70739096b760248cbdcf14889a816f32c6371fdb1674dd2e56d972
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c2f74a5ba5a3ce57f8305e5e5b5b1207fc930c6d4a1785eb57100b4c0529c15
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f42dba665f1a42282375fe4ecb662174fbf0fd0d11a5cf73ea5472e7597e586
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49ade70013266b198989c62e7c3683a8896e43e1b0f3eb37b7270bd6189f5040
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fcd6581d0ebbf0da5cbe43a92b25ecb99e13c992970cec7cad1df1c077835b9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:291244753b7d77ab38f0f93d59e045c1869b2b0edb1d0d640b92f775171ee21b
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:698d91cf517744428b098f1ea246ca15b0db2a160c6211cd85ffd5ae5737dce0
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9499e5f6c8fdab0ade30d9c1939db4b0b867bb8ae691b4c3b43101db8b6b981
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7908bea62acf4010cdc71c8f64aee54eede73b565651eb8dd0b9f54635a539f
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a75cbd8c2fe64c3445c3dd864a100fdb63685a757655cdfb41516c28679ddd8
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb6a229e94f7b278f14bc4252f220ad176ae968f38bb85f631e53b6246b6393c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04a80c65327c625642d035e8206bc9ca64e864c028d8b4a3406e8669b03c7215
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3c67e77db1e65b0d7e3ef66dd00391676dd7311215b5622bfffaed85e1f1fce
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be739be2bc000e184df0c1906f2d27fde498622c58588e4f530aa1136b9ef0cb
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a813c7efa0b3ad8243b2007a3f57413a577c7c0307190e76009703d9460737c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c9bcb6bcb600ffb07110a26456f23e9072bd867d488cf62cd3e265d161c7c3a
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9115dfb212899ffb360d968ee1f191e1c05f081b29fad05e1659f1582e94344
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3e7eb322a43ae2b6315786610c817f0f41c6852b1b7fc363aa037415972584
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26560d5e3301e3987452b498197562afce9cb6802fa7a2c3e2022df579851ad2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5f2e6efa120d0f1f64f94c75254890788d379e8ffcaee39bd20d67cc73d476b
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c334d456a55ca70a7225ff12a058de95b94693531f71ef9b030e6e664fd5ac9
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f1c18f7876c22f60318189c7d638560626d4ffe048ecf33ae1c889aa4468560
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e271b3662fe37b28996bc7534a1947f7bdb9aea7e992669338b84e0c94b47276
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:049ca7738f944df051e00cf484a6f96e0df55359e5435b2a70a8b2ab2b044842
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:124ed1da711701e4031baaf520ea4b59c1f6759a11929d68fd90b4bc1d34b661
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bb5154de17cad2e2cf74e8e2def524bab84db099d4df1c9ba055c1f67e0d2f1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7eed0989a5110927498cfd58f50bca43d3e375cff6f32b9121c7c6b72941ae46
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e44b79ee2b542b5f233c6cee0cb92915aab5337ea93e338bb57caa3c1638e03
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85d62d6fe4d2f7bb957f53ef458bc65bde5a410fefa316a1a4fbecc0a23c0300
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f6e4375255e00d6deddeba01225b23173c4226880309b4716baa58f71c57117
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ea08a83bcabf88f1eb99662d4b61b3e3b4d9c5a1d4b609fe8c7cdbae773b39
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2e93b368bf17750f5a261d079bcbb1fb1b271cd23caf6284d9dd85c76a98aaf
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:190034b2da4c15424705e3f6ebba1e092cc548420919d20717af502de561c3e5
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df978fddc485faa40f955dcf967b776bc1c8364b458a3761b9f9173dacce708a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b93301c966241676cf0d60e1b734854a63da73f10278e3307e7a9441d483a39c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b020b4450fb788ad45b3c0040b7b6cab31513d3960950158bb239cac4914a836
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:959fa9ee4d6f7f1952ba4588126397d40678b7ee58d5082325c4571e1976d067
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:751687fab42425b2bea245f8a8671525106af756e938ee7b0ae4efa1a4f96548
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b767449575c610876864ffc756d0570b4c4d8978bee3af404b0ecc02b2d2d964
|
3 |
+
size 11395
|