Upload learned parameters for llama3 in bit 8
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/llama3/8/norm_nlr/comb_2/init/lm_head/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/lm_head/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.up_proj/_s.pt +3 -0
params/llama3/8/norm_nlr/comb_2/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66ecbaa863d39e4d47eebf9a4356857a13d22db5d94a81c1d138fdc53328cec6
|
3 |
+
size 514115
|
params/llama3/8/norm_nlr/comb_2/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f1cfe067eb18dd27c4e6e9296a0ee315ea15b3e4dd1c67beea53ab3b9c9106
|
3 |
+
size 514115
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:565bb424841d0f1982966eed201105b334de4026431c2ebbbc361ba40c801093
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:346082ee61ff83e8e4f8c66a9ab5522deeb5ac0914340df408434a7c8e01303b
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ec65a7de1344c8401a9ac2e7ceef528de146c0bad3ec17609967972e08d867a
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e45f9a9967f9455728b4fc8c6e87d02e42960d3e6fb89c073f9590f4b2017ac2
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fa3eaf749627937c6cbdaad004a172cab65574866e212b4fad9d553d6aeb5cf
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0af70058706e7c563cf3bc19b8e2de4b9ca0933e3f4f0668d4235867ee5b3cdf
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32187f7ab7979b2c36ec982f24f081e45d30f2cda3da3534cf426a13a35ca0a1
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38cac571492b2281186c064a56f82b8af58bc5dd6523dc2dbb59a4ca3573c51b
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47e14b3488bc6811e10b0ec27ec1f34920743e8cca30fab9ff047a8b2bcbef73
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f5b2c353acd6c9c06c9eec87dba7b4621d3600ff25d147b58ee6aa636b765eb
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2b1cbaaa7b6e7931abba43318061d3986a9185800ad839340ebd180a0b20f2d
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e47caf589f652d7e294b6dd0757eb8e2c6e1c573f4c7d6d60c2c72ed9fc3d9f4
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a592355ba5d3fadc335a2ec5c240be42c309087340cdb27cca0daa76c37c6fe4
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61a6f793f28084f6e292ea515e66d931d3cd7cf92cdcce559547a11b0fcfc249
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4fc71103aef54ac4e4d73345857b6c5d7be2bf6778ccd5b0b4bd6cddb996475
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f0469df70d9feb2c1647576552d3d4190b70b92ba4db52594fe027e9a2e3eae
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be6970d5f9224ea79efa49c5992b72bac31759188de87f1b30bc215392f5183d
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:009cd770d00b7cdcc5600268d51acc916c9d227ce47821d59dfbd661b9bb2d85
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a296bbe1730d1793fb25baa2197002cbbf76ff70563df0836a355439ba4830d
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20c3d1bdf55f5ba63634a1b9f67cc463add7eff97fa411110d3a7441c7531135
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2bf0dd42b7e184b6475179e63ae6256dc3660f9bf7985af0e984775039bad3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e13ab5310e4db901d77848a668ce942aa672312a2a26c20f2021967e7cd405f
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1f89734062f512c80f275148f142ae2c35b2cfbba68b998d7a61ce7f806082
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:664bd73d80759cf519e593869cccde2fba74c02f164fccc61df1ae0d7f91a9f7
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be54b22ff5b8f73aacaee336a05c96e07ee16f259ee004b8c4b1d2cb1b809400
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa46ca73b880e3d45c366d1d3d9d538b21235c6f696675ace1cdfbcd33e9579
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_2/init/model.layers.11.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f73cf8417a8c72974b4f6ff7a681f6912975d03e8268000ed625eb89cfaa3817
|
3 |
+
size 58435
|