Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62588dedc783584dae27f3d23a226c32574e40ce323be72190800b9afc6a9021
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:058171cd18bf5e9198f2a8295f7b3e9911bdbfd82283ff17e06d4d4cb5f70c1f
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67b588161abdd597005966f5109842aff19c10b0544c0a9b6d0ef91260935ee
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85400073b12a2946b828cecd3af576549a350e9caeb9baa7805e704f78bf5612
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb86f07ab8da41b8c38d544bddbf505e1de1c4b82ad6f436545995040074d6a8
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9bad0700e4f7d96b59bc9e70fa4c630cfa9b3421f39ac6afc37c26933d244d0
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66e3177a268b8878240ce92a5d364b47d136308593b3a505cc464b97eed5d552
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de94ed9e2785201c2e9b0cb152588c0b03d33055aaa2cfdc2e774c73c4ac11fc
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f92e32ed9a68cbbe9f89a5632716787ed02141cba5283dc7a35a2fceeb54fa4f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75d0d2c9c05e779e12775ad6ccf0f0798f322e060c05d70bbc5063b8a5bf5c08
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc51217eaa0eac1c5383099a385314908c341acdec138d07f43522db451e5d8f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b66f70ae451e5e7391c2b747ca5a6499b5ce0edd7807dfa4cea987794949a10d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c13f5c22a99f97522b84bbd365ec394a5ac00fcf75996fe620dccec6ad4451cc
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e7ba4111174012f68a555274a22854073cadee34115171cc318763646a8c1a8
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a3dbd9a29fdf8264118371ed7577366eb7a3fe086dadf3344cbb5482fd2b314
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f01a1739478e6989ee2b4b0261ae3965761a71492af28ba226adff2575b2ffc
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f43fef3a3f905a06b6a50b6f5837aac24e56e982d865ef6fef78aec32a101059
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3b273c190d655c5fa261046425acedbe6569085a040fad58d72e1f5d37a4490
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77feac19e2596c930be95ed91d5099f6e1e2fd9bd742a0d7432b502ad787ed4e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:094405c736b567bfac6ec788d3d360a5ec6a58dbe549068284c9229bc6e6c173
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48c2b1cc354135684ecbff2c221daca459f5c316482821174119b5cfa6246a21
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a40b19abe7b34c47ee90b948e87a6cb8fc490997418cb02552f6688de551ce9f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5943f1fe50d05d9a1803a67728e5ccea9eeb99bf4278d3e19cd516b6c08c7d0
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f2463491be57644a78413288df310b6d3a2b041af44cde6529927de23eb8fc1
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:232a51bc25a1a069723ae0c47000bd59e340e9bcdc42f3a78c5e2b8b12c77cb8
|
3 |
+
size 11395
|