Diogo-V commited on
Commit
6538ff5
1 Parent(s): 758e9f1

Upload learned parameters for llama3 in bit 5

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/llama3/5/fixed/woq/init/lm_head/scale.pt +3 -0
  2. params/llama3/5/fixed/woq/init/lm_head/zp.pt +3 -0
  3. params/llama3/5/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt +3 -0
  4. params/llama3/5/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt +3 -0
  5. params/llama3/5/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt +3 -0
  6. params/llama3/5/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt +3 -0
  7. params/llama3/5/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt +3 -0
  8. params/llama3/5/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt +3 -0
  9. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt +3 -0
  10. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt +3 -0
  11. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt +3 -0
  12. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt +3 -0
  13. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt +3 -0
  14. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt +3 -0
  15. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt +3 -0
  16. params/llama3/5/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt +3 -0
  17. params/llama3/5/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt +3 -0
  18. params/llama3/5/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt +3 -0
  19. params/llama3/5/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt +3 -0
  20. params/llama3/5/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt +3 -0
  21. params/llama3/5/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt +3 -0
  22. params/llama3/5/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt +3 -0
  23. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt +3 -0
  24. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt +3 -0
  25. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt +3 -0
  26. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt +3 -0
  27. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt +3 -0
  28. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt +3 -0
  29. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt +3 -0
  30. params/llama3/5/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt +3 -0
  31. params/llama3/5/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt +3 -0
  32. params/llama3/5/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt +3 -0
  33. params/llama3/5/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt +3 -0
  34. params/llama3/5/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt +3 -0
  35. params/llama3/5/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt +3 -0
  36. params/llama3/5/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt +3 -0
  37. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt +3 -0
  38. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt +3 -0
  39. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt +3 -0
  40. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt +3 -0
  41. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt +3 -0
  42. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt +3 -0
  43. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt +3 -0
  44. params/llama3/5/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt +3 -0
  45. params/llama3/5/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt +3 -0
  46. params/llama3/5/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt +3 -0
  47. params/llama3/5/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt +3 -0
  48. params/llama3/5/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt +3 -0
  49. params/llama3/5/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt +3 -0
  50. params/llama3/5/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt +3 -0
params/llama3/5/fixed/woq/init/lm_head/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fd9133b6d33e965ac253e645ba78a1847accebb56b960ccde6535eb2a862e89
3
+ size 514130
params/llama3/5/fixed/woq/init/lm_head/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:600dca7cd51ab240c1a4855ddf93391ed2490df8ff13ce073c63f8edc29455f9
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1745bd8b4dc422427fc7d30584c1128e925776fab4de1e2f5623c6124442e920
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa5cb81e8537d798bf470111ffa2d96f05881c018cc82951e89ff12254f85e32
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab433d59b9a8d5f20916e5d58b4d885ad065020b568bdd239a79b38caf527e77
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3762f047edf8a49bc03ff0e401722eea69be7519488fcf612ee0fc73414b082c
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54a9c7d94ce007ed841ceced457cc565a8aadd8979e6c69c499559aa1373e1e4
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b6cbdc840657a0a25634b511a92a658144c1b9b7b16424eaecbc2c3290aed5
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a884ba8050f6d03d675614108cf48b8fe6ae77f7d5b493dc7e80b671ba55bdd0
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4490c9e67d81c75d09e6b75f62d5f8691c03ec6bc290d2573698c23074ff6c
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3e9fceec3aef03beaae884389a2a7281850d5a350a03a71ae9765d07666ed6
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa06a6437d5458c68e1583929d4215c474608d56878c33dc1439d824e6f24ba
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50ace75a5f2c1c2959047bb1741152efd6a891c767c14f23a35c53e9be03a7b3
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34e121a5d40f235a577584a86e6a799e1d8ee84fd7e2cef60e423b64a37b4561
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86ab37c27e1497c42876286bc2fe81d378a836f7c2a55796533d9a523a7f171
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38f85be9b07b24bd67cf92d46ff025ec156f0879b9b15441a267c4342776f18b
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd1bb96d68d8a3f5f6d597218cd6a2d5146e1edf16e01c1cf939d80ec8120152
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:187652a19ab1facd9c1b5bbe0f3dd0c4a9d57d962948a1f97e86f50f8a8efabd
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56cdff794d522e35186cdd38b449cb869b94388bebe83f8b99613c1e29c7435d
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:409ae09052c23c1f7511b277e1a552162f2e3be8dd7db0e8d51dfdff8aff08c3
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e7dee5f6def6b5f46471d13136f846069c597c846ea6e0fdeeb4ece061148ea
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07bd5e2dd8cde7090a76a749a1e00da43ccff3f92eda1efba366cfebee52269f
3
+ size 5202
params/llama3/5/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f95034676422b923b30402c279b09058184b1edd7fb528a46de42404a9e348d
3
+ size 17490
params/llama3/5/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08e37e86ac63009f0a0ff14234a7892165824fd18b535f6033fbd8493352661d
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/5/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4963fd4cac1b1a761a0e4fb8ad7f39d2d5d10ffd85f38cf74ddeb597d042676c
3
+ size 58450
params/llama3/5/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091