Upload 8 files

#1 by Xenova (HF staff) - opened
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbb834378afbc7d0f00fda65861e06cc1af85730f68b596a66f2aa068d4b1124
+size 17963874
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a40ba6ecc73f01ecf139d871ffe936f5aa2af3a3316765a3dea6608c7a5764e0
+size 4715295
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbb834378afbc7d0f00fda65861e06cc1af85730f68b596a66f2aa068d4b1124
+size 17963874
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb5007aef59fd63101e45ffe5bed76ca7e1f2d1fe638b5de29b50235f629f323
+size 4715295
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb5007aef59fd63101e45ffe5bed76ca7e1f2d1fe638b5de29b50235f629f323
+size 4715295
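The `.onnx` entries above are Git LFS pointer files rather than the weights themselves: each records the LFS spec version, the SHA-256 of the actual payload (`oid`), and its byte size. A minimal sketch of checking a downloaded file against such a pointer (the helper names and local paths here are illustrative, not part of this repository):

```python
import hashlib
from pathlib import Path


def parse_lfs_pointer(pointer_text: str) -> dict:
    """Parse a git-lfs pointer ('version ...', 'oid sha256:<hex>', 'size <bytes>')."""
    fields = dict(line.split(" ", 1) for line in pointer_text.strip().splitlines())
    return {
        "oid": fields["oid"].removeprefix("sha256:"),
        "size": int(fields["size"]),
    }


def matches_pointer(payload_path: Path, pointer_text: str) -> bool:
    """Return True if the local file matches the pointer's size and SHA-256."""
    expected = parse_lfs_pointer(pointer_text)
    data = payload_path.read_bytes()
    return (
        len(data) == expected["size"]
        and hashlib.sha256(data).hexdigest() == expected["oid"]
    )


# Example with the model_uint8.onnx pointer from this commit:
pointer = """\
version https://git-lfs.github.com/spec/v1
oid sha256:fb5007aef59fd63101e45ffe5bed76ca7e1f2d1fe638b5de29b50235f629f323
size 4715295
"""
print(matches_pointer(Path("onnx/model_uint8.onnx"), pointer))
```

Note that model_quantized.onnx and model_uint8.onnx share the same oid and size, as do model_q4.onnx and model_bnb4.onnx, so each pair points at identical payloads in this commit.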
quantize_config.json ADDED
@@ -0,0 +1,87 @@
+{
+  "fp16": {},
+  "q8": {
+    "per_model_config": {
+      "model": {
+        "op_types": [
+          "Add",
+          "Cast",
+          "Concat",
+          "Constant",
+          "Conv",
+          "Div",
+          "Gather",
+          "LeakyRelu",
+          "Mul",
+          "Reshape",
+          "Resize",
+          "Shape",
+          "Transpose",
+          "Unsqueeze"
+        ],
+        "weight_type": "QUInt8"
+      }
+    },
+    "per_channel": true,
+    "reduce_range": true
+  },
+  "int8": {
+    "per_model_config": {
+      "model": {
+        "op_types": [
+          "Add",
+          "Cast",
+          "Concat",
+          "Constant",
+          "Conv",
+          "Div",
+          "Gather",
+          "LeakyRelu",
+          "Mul",
+          "Reshape",
+          "Resize",
+          "Shape",
+          "Transpose",
+          "Unsqueeze"
+        ],
+        "weight_type": "QInt8"
+      }
+    },
+    "per_channel": true,
+    "reduce_range": true
+  },
+  "uint8": {
+    "per_model_config": {
+      "model": {
+        "op_types": [
+          "Add",
+          "Cast",
+          "Concat",
+          "Constant",
+          "Conv",
+          "Div",
+          "Gather",
+          "LeakyRelu",
+          "Mul",
+          "Reshape",
+          "Resize",
+          "Shape",
+          "Transpose",
+          "Unsqueeze"
+        ],
+        "weight_type": "QUInt8"
+      }
+    },
+    "per_channel": true,
+    "reduce_range": true
+  },
+  "q4": {
+    "block_size": 32,
+    "is_symmetric": true,
+    "accuracy_level": null
+  },
+  "bnb4": {
+    "block_size": 64,
+    "quant_type": 1
+  }
+}
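The q8/int8/uint8 entries in quantize_config.json describe dynamic 8-bit weight quantization (per-channel, reduced range, restricted to the listed operator types), while q4 and bnb4 describe block-wise 4-bit weight quantization (block size 32 symmetric, and block size 64 with quant_type 1, respectively). A minimal sketch of how the int8 and uint8 variants could be produced with onnxruntime.quantization; the fp32 input path is a placeholder and the exact conversion script used for this upload is not shown in this commit:

```python
from onnxruntime.quantization import QuantType, quantize_dynamic

# Operator types listed under per_model_config.model.op_types in quantize_config.json.
OP_TYPES = [
    "Add", "Cast", "Concat", "Constant", "Conv", "Div", "Gather",
    "LeakyRelu", "Mul", "Reshape", "Resize", "Shape", "Transpose", "Unsqueeze",
]

# int8 variant: signed 8-bit weights, per-channel, reduced range.
quantize_dynamic(
    model_input="onnx/model.onnx",       # placeholder path to the fp32 export
    model_output="onnx/model_int8.onnx",
    op_types_to_quantize=OP_TYPES,
    per_channel=True,
    reduce_range=True,
    weight_type=QuantType.QInt8,
)

# uint8 variant (published here as both model_uint8.onnx and model_quantized.onnx):
# unsigned 8-bit weights with otherwise identical settings.
quantize_dynamic(
    model_input="onnx/model.onnx",
    model_output="onnx/model_uint8.onnx",
    op_types_to_quantize=OP_TYPES,
    per_channel=True,
    reduce_range=True,
    weight_type=QuantType.QUInt8,
)
```

The q4 and bnb4 settings correspond to onnxruntime's block-wise 4-bit MatMul quantizers; their keys (block_size, is_symmetric, accuracy_level, quant_type) mirror those tools' options, but the code above covers only the 8-bit variants.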