Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0de85d6fe6c256812e9f8428bd42bb83b846533f731584996729c1488fa6fc6
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9a9c8cdfdb62fbdafd0d355be8ea28a6b64e45b74086e899ecea9db8a8d3df4
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f44831dcc865460400a4dd7dadfa6829240e33beccb95bf9f4dbb8aa6811a40
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:455c7e6e49897ca6a524d8defe3fa177ece6dd848437058463b3be71065dd17a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f720724a2417d3d781b450fc655ca3e3d5493a5fd10c8d0df8b5a10756834da1
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1287f0664a8abf1285f014112f7c3da14088090423f77831d6b81f5b556d7cc8
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:014f88b932609224bdd05aa41f3e035d61a2ed645c4ecdd5c6791e744413e136
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4342adfe2e1e9287705e8fedc3f3b9cb5ede53fda945989261257314266beb8e
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0d255da59638582b221bb8e19c06ee7d65660dcaa4f960268f14156fa562a87
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d877b5b209e20581145ca6503faa9d2fe302e1d2fa92543dfb60995fed3f0c52
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ddcf127654a53d4a1c043c8ab6273aa647297eae59bcdd211ab963a52171f1c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cefa623dd0df90ef171b758ba93f9146d41e46f528be733efbeff8d9487c8bff
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9f40cd8f9041e09e17ade7c2253e4f0f86e63fd5acfc9119991986a226516f9
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64371fa2369499acb4f752965b6942591a7eaa8a0abf0112e2cf766096551f81
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31c94775d719fe05b2fa602146da630c6e2521f839391c4b24d40a09470b15da
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ae4d1076ae0ea968a1bf9ade333302c2f3c2801dfbb56d478f6ed19d09805f0
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2f5a585f994241aff4c4e6718ea8f08ef29e065c8620052a9eeb55545e62bc7
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a33d2fc70d93ad96406aebb0b28cd70d39a17f3443b25b5096ce861fcbedaed4
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7c49827df14de9552d1dccb62eb2125426368a5cf07ec7be3d51a3b0257a6fe
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c112c1aad45202c1ed8b6677e4d54682e817c16a99001773c2bbe3282cfe4aaf
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19808614a9721ff7ab7d8de6d360bc460f33c1126042ae5226812e7a8b8835cd
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15e3d9def26838b4f6652707a1c466b31e1082823a5ec4657f1d1157920e0037
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b89523f92e33cb8a16df05dfdb7e1fbd55c5a3988c472f43b927b201887d712b
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ba861e6f40df75a873fc5c5668de4819ac878aa501239fa5935dd0f7e900943
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c873d66b213662e3b0bb10babef4d9f28795a4348684aaf2e8125026591e21c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dcdb4c589b416065eb77acac3161e28fe24e11f51cde3f6fb816296d81132dd
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb43f0df21ed3e492a800dffb06adfd6ccc6a2a8c69c764af5431712505d19e2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb5be1e7d01377e08e1ece2a9fded1d1b155219164e32466c6ad2ab28d23acf2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25ae4084cf581b7b0cdc915684a7ef01464df4e16811fc1c00f6a13bcec86506
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2aa10abfbc1b8dce876a9390ceb0bfbfbb26415791b5ad719f5d45cdf0b143c
|
3 |
+
size 11395
|