Diogo-V commited on
Commit
e8668fe
1 Parent(s): 7591243

Upload learned parameters for llama3 in bit 7

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/llama3/7/fixed/woq/init/lm_head/scale.pt +3 -0
  2. params/llama3/7/fixed/woq/init/lm_head/zp.pt +3 -0
  3. params/llama3/7/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt +3 -0
  4. params/llama3/7/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt +3 -0
  5. params/llama3/7/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt +3 -0
  6. params/llama3/7/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt +3 -0
  7. params/llama3/7/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt +3 -0
  8. params/llama3/7/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt +3 -0
  9. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt +3 -0
  10. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt +3 -0
  11. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt +3 -0
  12. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt +3 -0
  13. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt +3 -0
  14. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt +3 -0
  15. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt +3 -0
  16. params/llama3/7/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt +3 -0
  17. params/llama3/7/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt +3 -0
  18. params/llama3/7/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt +3 -0
  19. params/llama3/7/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt +3 -0
  20. params/llama3/7/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt +3 -0
  21. params/llama3/7/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt +3 -0
  22. params/llama3/7/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt +3 -0
  23. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt +3 -0
  24. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt +3 -0
  25. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt +3 -0
  26. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt +3 -0
  27. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt +3 -0
  28. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt +3 -0
  29. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt +3 -0
  30. params/llama3/7/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt +3 -0
  31. params/llama3/7/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt +3 -0
  32. params/llama3/7/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt +3 -0
  33. params/llama3/7/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt +3 -0
  34. params/llama3/7/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt +3 -0
  35. params/llama3/7/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt +3 -0
  36. params/llama3/7/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt +3 -0
  37. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt +3 -0
  38. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt +3 -0
  39. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt +3 -0
  40. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt +3 -0
  41. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt +3 -0
  42. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt +3 -0
  43. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt +3 -0
  44. params/llama3/7/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt +3 -0
  45. params/llama3/7/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt +3 -0
  46. params/llama3/7/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt +3 -0
  47. params/llama3/7/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt +3 -0
  48. params/llama3/7/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt +3 -0
  49. params/llama3/7/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt +3 -0
  50. params/llama3/7/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt +3 -0
params/llama3/7/fixed/woq/init/lm_head/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99a4cc4c882cfa55daacd5728682e890bfc30fff2a2c794fda264691ef699569
3
+ size 514130
params/llama3/7/fixed/woq/init/lm_head/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7d84257c9954c56ab2923eb580a37f399cfd7fb677e23bf999141a517390c90
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.0.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2172fa3aa0d0bb903392e9ee35ec076a710724ead2bb8f8fd80867eb055b5a
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.0.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:216db9918b803c3592049eb151ed6c42da3c400f3089d2f23008b8c894860f54
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.0.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9fe260fec2815e8259bc015caf49dbc4df54de8ceff200ba71bdefa06fbbcc0
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35910020ad7f431f2d69685d8fa3cccf0adf6070290359bd616a61c9b6b94e1d
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d9e966938a5b6d7d0e30191d5d34e517805079ab377685e90548a9abdfd7d81
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02c55446bb5903a74fe16136221d97c75450d1aa12539414638178a3db1a1459
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.0.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbbd55fe90635fb45c0e69b5736f22c129755ebe0a69b4976cf2d132e854ef92
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.1.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2a23e20305ba5c50fdd3081f8699f625383c1696e37aa629163971fd13f07cb
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.1.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e99cd225b11ab8d75faa4d2623a56c7f0a884a18b67b041702394470230efdb2
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.1.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687e0a8d94d90f0c44a08653ef10a1b857b222f6725e28789a7c24f61f498507
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56051896703f9674543c4a97b0a59cdf31974505831974cf3c46d8fff04aa090
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd2ad0e367277f4daf4f829d4acbc39653daea35b83df3f1a21d5bab57b5f7e2
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a0e8f5fa146d79a0cb004fdb6f5dadcb1cbb624504de262753cb4353c72d257
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.1.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eb66170ecd3dd80f15b00c75159bdbd61b1d9057b2eca340fc8f00f0f463a3f
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.10.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83fa202e8e3e92aa1a0e5eebc853704539f50730c5be0274375bc5eeb58ee4ff
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.10.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e49bbd1a7bba9bdb6eb35b356918c343ab3a70b8be845eda33b423aecb535d
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.10.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.k_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b3cf66307a1d752c142fcdb9603b7c21fd99476e457df5e12748764631d9582
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.k_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.o_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cbd421bbdfab1af34166042010d2075551e61cd4b9e2ac8c0977e3d1a1aa9cd
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.o_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.q_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70bf0e25aa3cc03b976d05379e4fdd91a092f2eade24e017eb07c2519d5e6fe2
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.q_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.v_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4edf40e8b33fa21b174fed3c03e1aa42f0f5076bd4be22dc0e3dcd86ae02dcc1
3
+ size 5202
params/llama3/7/fixed/woq/init/model.layers.10.self_attn.v_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.11.mlp.down_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76d05bc2ed4440e12f1deb47817c95b592fd60f3e5c2935fea202034afa5acfa
3
+ size 17490
params/llama3/7/fixed/woq/init/model.layers.11.mlp.down_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.11.mlp.gate_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:780ce3dd5de790e6855e653f005f34ef5108658e0509d8b8e16887193a814c72
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.11.mlp.gate_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091
params/llama3/7/fixed/woq/init/model.layers.11.mlp.up_proj/scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb04c1576fcecb0f197b38ab95dbea98b99696f0274fd7c2f79725c1da9fdca6
3
+ size 58450
params/llama3/7/fixed/woq/init/model.layers.11.mlp.up_proj/zp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74cbd027a8e6a7253e3ee35cfc1ea4eabe7d830e85cc2a975144d18821839da
3
+ size 1091