Diogo-V commited on
Commit
261a5bf
1 Parent(s): 78857e5

Upload learned parameters for llama3 in bit 4

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/llama3/4/fixed/woq/init/lm_head/scale.pt +3 -0
  2. params/llama3/4/fixed/woq/init/lm_head/zp.pt +3 -0
  3. params/llama3/4/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt +3 -0
  4. params/llama3/4/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt +3 -0
  5. params/llama3/4/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt +3 -0
  6. params/llama3/4/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt +3 -0
  7. params/llama3/4/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt +3 -0
  8. params/llama3/4/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt +3 -0
  9. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt +3 -0
  10. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt +3 -0
  11. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt +3 -0
  12. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt +3 -0
  13. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt +3 -0
  14. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt +3 -0
  15. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt +3 -0
  16. params/llama3/4/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt +3 -0
  17. params/llama3/4/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt +3 -0
  18. params/llama3/4/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt +3 -0
  19. params/llama3/4/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt +3 -0
  20. params/llama3/4/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt +3 -0
  21. params/llama3/4/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt +3 -0
  22. params/llama3/4/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt +3 -0
  23. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt +3 -0
  24. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt +3 -0
  25. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt +3 -0
  26. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt +3 -0
  27. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt +3 -0
  28. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt +3 -0
  29. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt +3 -0
  30. params/llama3/4/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt +3 -0
  31. params/llama3/4/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt +3 -0
  32. params/llama3/4/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt +3 -0
  33. params/llama3/4/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt +3 -0
  34. params/llama3/4/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt +3 -0
  35. params/llama3/4/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt +3 -0
  36. params/llama3/4/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt +3 -0
  37. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt +3 -0
  38. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt +3 -0
  39. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt +3 -0
  40. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt +3 -0
  41. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt +3 -0
  42. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt +3 -0
  43. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt +3 -0
  44. params/llama3/4/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt +3 -0
  45. params/llama3/4/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt +3 -0
  46. params/llama3/4/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt +3 -0
  47. params/llama3/4/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt +3 -0
  48. params/llama3/4/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt +3 -0
  49. params/llama3/4/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt +3 -0
  50. params/llama3/4/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt +3 -0
params/llama3/4/fixed/woq/init/lm_head/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1deabb894696143cd8c206ba4d69b7b5a9d6cb8af1f4725b8cc1f5fb0f8657e0
3
+ size 514130
params/llama3/4/fixed/woq/init/lm_head/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5659b3434837424e419858356b0f534e08584612132ffe0420f4c320873bb2b
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e711d95c78cfdb13514f6bb97538b1d66bbde4a68082f9223f524fb1812f0bf2
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89ab767fe824fab198fc1d7297418f8dcac6d965679ab44fd7ea08e1352ad930
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:093e6f016caf10b4662a63e403633dec97ff335dc9d861dd92593e5e921e42f3
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a415b289c6171e58fd5bb9d2b357d0da5616e29dd2a06a3e913c46d3934b3ed3
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:070f116ff9ca39d20167c33aefb08e38cda23f2641ce5e92a1fda0db1a233976
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a34fb62f40b1f0ef0b51247755e732ffe4914957319006bbc5c1863ffaa51b6
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4db4f775e92abbe1698a478da4e58d60a21647984fcae2a61f1432d027e2ec14
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dbb69dc3091eb2bb25477d691bba2348b8815a5ef0d0555656a611c8a10d308
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a0de69e533dc8e888d9fea135552f3e295393eb2df6b064cb60e4897b7b9e17
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66b077baccf6bf86abc96668a0a6ff8c98ecbf20fbbf898cb0ef48d016d8304b
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aafc7efd74a7d54feddcab756051c99ef5b9ae4eff76ac3da6f663375999c740
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6d5c0673b20e757891db34695b0138fbeca28f21c80424ae36efe42206d3dae
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8262690d13c6be1d4058cf5b4f300ebdbee6f3b7fc6f33914298a0309f2b2a3b
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d44e723ab9d9d935a5eaec0bda8590a51fe422179b5b8d243149ac04bbbb676c
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7749a3abadc83fede08794fdf41282a8b03ed4f6d1a35d6882cf736ff61145e
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7904a7821505036283274bdcbc4a396e6c09475c7f9e6c7bea12ffc3dcdeaaca
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5a403caf36c83b92327ff6ae6164c70128fa73ad5a05ec879216a871892710
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92a1e9116474a9afe8cb882e0e241207f070f311b8302605f18a8901bad76b22
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:668332d89c8d9f7871c26d29f18906e189b19421c165cd02755017a0d2a12ffa
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c42042b1aef9a184fe97fc56f9d4a9f4995ed50dcfd6239d760c54234a5d096
3
+ size 5202
params/llama3/4/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56c18841e47ae62273d4ca991958ab9bf67d61b4e67e658658290eeece9a9a68
3
+ size 17490
params/llama3/4/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81976d4f6186d570f351a57ec581daa73c70a96ae615a8040c9b55209da31ccc
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/4/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d4f022bbfa51a79908e138b3d25f2d9732398bb3220c80b3a79e4de41e245ce
3
+ size 58450
params/llama3/4/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091