Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/7/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/7/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80a5825bed9266e510ba8da5a78cb800fa144b0e387dbce29dc1d057ff42876d
|
3 |
+
size 205955
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54a12454337d089b1739075728d6e8c8f8629dddbd18c9dc99c7ee2c91b99b99
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c8e9a07df6d5b0a7f6339150e21db6effb73831abd2de1ec33e0317bfd3b377
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f78654a98eb8cc27b118d042f5146f0778030867ee7e62c975407d3f0359ef5b
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e82922944b3ea0f79f2bb9dacd1ed6eca0c29a113495bbf01ef96f2de3762e9
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a15246248129799317b50ec07d34c899f3b6ec7df704365b56a966b4a3e2f6d7
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66ace67bfdf4563ef64a4fc2b349957f98a8790f5016adcf467218784711911d
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27c7b346cc67e4a33f8291c71c4ac52d6ef0dd39afd8ee09d0867b1a79a78f28
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f60f1949d94073896f96e11cf5d073bf9dbd7cdcdbbc213f349d8e730a1867d
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d43cf7eeb209682bff0421ffc5ee78e233b20ff22ed8d5be307d123cc287f85
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0805d3100daf65fbd0333ad35d81d07b374d57d4e37a71f85cff002ec990b4e
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49bb32d1caa1a602e6f2c6cad01d0e0e82bff7e8581917dc7868f9b2b3ca84a8
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22c5586e36bfe4b904782ca5ae0e60ff238691b94fb4cbe86b162f350a48fa07
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5cb95e8d10e6fac7e54420a4c554651a1031d5438e24ea862a606844b3dc3f0
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5214444581b428d6136226c3b74e0c95df25ac0653ec9e58b96dfcfc06248ff
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8351a90f444b93ccc655b96ec7cfd5d41c3db2ec1474b9d3980057d59af46645
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:957ce5b84a70279d2180cbde93621a49b8eb3f6461fec51cdddeb793b631242c
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1372e9d40a5b522bb051759a748f5e38ae0e1552fa9ad1f7362c6ec163540c32
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dcb1c201eb81e1e214853d14a82bd3b23b85a418c748211fa44f24d8245c806
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1582c8227042ac258e3950db98408f5c2f00a7207f15e0dd0db2385d3a073ed
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7d49ad1b986913046106ecdd7f98d6fe9cde7fb1380ab7f7c817586c92db3e2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ff62f51c2f97d73eb5141b6cd502c0d0d270ee13b3e10c144bc67f57ed991b6
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bef6abcc522719972afeafaad9a54abd1767be94955c7dd3dbb6cbff13c9fa8
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66454473e33e62e2640d95bcdf8a6a5dd74696e57da1eb85efb3e313327c74be
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:430132e3256a7a237f7839012b375a961ce89dbb6d0f5c16bc0cfa4c0a37a9ed
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:946895e78799e18a808f5e15affd5a879c17b629a91170ce0cda6b11a863430b
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:465e93456d7e0b7d4052716de9b816977b1965c4bc53a31d16e17d8437177dc5
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3817034a3a3a10f6b2ec85ce103e2ddd26c401ec4363d45c6f04ed236df8649f
|
3 |
+
size 11395
|