Upload learned parameters for llama3 in bit 8
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/llama3/8/norm_nlr/comb_4/init/lm_head/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/lm_head/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.up_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.o_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.o_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.down_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.down_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.gate_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.gate_proj/_s.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.up_proj/_0.pt +3 -0
- params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.up_proj/_s.pt +3 -0
params/llama3/8/norm_nlr/comb_4/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b85c27d99525ac791a62b99e0a085521247ceb91f869784c19395ac6b00a546
|
3 |
+
size 514115
|
params/llama3/8/norm_nlr/comb_4/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68a9124cbe4f2f6a762b04f8f5a90e1496317bcf66bd10093925142ee31eb7a7
|
3 |
+
size 514115
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:066686dd4c695f79a94643bcbe7542b64b0354652e010175b913eacac3e64b0b
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cbc6f3885a92a1684da0acce4bc0154a81bae490ba57fda93e24bb4072e90b4
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80ba8870c4695010fc9dcacba46e0026804cc3b394f83bfcff33b328e9bec49d
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19b5f98ed337b7fdce066506c00d1830a1abfb548d6481f58e5435ba41cd9eee
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7402b46f7b4b45bc435740a261c810f7caa9d93dcc62fd332cfd4c608ce6dc2
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92ddfd8aa61a51a1e7becd9a23f7b61d232e50d1b2e2bec6f1c82dfa0129b9e5
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6264d776e21d5fa5f42e0d8ff0e8e3da2444555888a2419f08a87c49b5873e2
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:782467d7a52c8f41dc0d0daf598f76e8a97adfb0dcd8d73237903afc36cb56fb
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:251635256ff47d793bbfb522bcffb92e42ce3ebf7c918aee427a93e1052ef25f
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ffa9950a59d7b6b821e5d3cd6553595c886e7d9244b67c5199ce67cef84e577
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dea890d76fc16968816c7e92125638c5576d5ad60ba3a69fab5b4479bd81b48
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6579692eff67cc609b777ba190734c93e800b9535bd0dd02734cfaa3df30ce6
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2794173f45e86a8cde2903688e485ab79ec15a97e941363fd3ad1139e0376be
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6a646165396bb9b9722941d31a1927fd3f0a333bc64883dc92eaeb4e3e5dfda
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcb83147261e3719248e81af6892d171a38028e88a709f347b8f1393d8cfc597
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eacdbe448f46ac112f8b7c370f96d35475fa714b036783bf9b22c31acb8c596b
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04e56d83b4d7372c8be114dcf0c996f7434d1070f4f2c5041e31b563540a4601
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab019d48452ee4d4a8a21cf9ce4745e353a32ed5211a8fb940686af51b37fec3
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.o_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d61303189efdcb4fa12b236eb248d47fa7e6a9a5c5738ffd7499ab4028269681
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.o_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:390a32df2863a5397badd9681a66430911732f4ff837f27bfaca968bac6c7c4e
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4cb15394af6b8e63df97bbefe244b523b8ad8a63ad627f5178308c7de153b5f
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab76bae749f7fdf73e7e0ba4dc8a069296c020a908e22abac92c289e0fd53cb8
|
3 |
+
size 5187
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.down_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e1c2875e415433cc0cb692b8f33c04828985db052470365977bb056e993037c
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.down_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:473e53cd029fa4d1dde68354b5db90323840ce7d99e1db24288a03c5ebeb7160
|
3 |
+
size 17475
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.gate_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5731db3f4220b39207d55bbf7dfb482e49a96ced2048139bd81452856274acea
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.gate_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.up_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f757832d4404094dcb42d94c8182022a36b689e0aa165cb3e0892bb59d3838ff
|
3 |
+
size 58435
|
params/llama3/8/norm_nlr/comb_4/init/model.layers.11.mlp.up_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55ea395d8289f0eca110af10ade357f78dc173c47d08de0fcc00d99053647b6
|
3 |
+
size 58435
|