Upload folder using huggingface_hub

Browse files

Files changed (5)

onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +54 -54

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2e16283f568a32bd8e9f8716e21a5af318e6ba5438b82d76a13265a4661494fc
 size 1415934308

 version https://git-lfs.github.com/spec/v1
+oid sha256:f38588d4238680348dbb1c16c15d2bd2a3e7fc219990b9070c957616ae9ebc9f
 size 1415934308

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:95fdbeec3fc8c6116c41b2153af4de72ca014a3466fa24b1edbf8904af9bae39
-size 356700610

 version https://git-lfs.github.com/spec/v1
+oid sha256:d5cf4e5190f545d935d86d09be9f9f66fd2912f1f4ea5571e5d67139b83247db
+size 355594162

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54baba9918925344934e39d5ccc30d10bba3da938240fed4a09e072c6323549d
-size 355819455

 version https://git-lfs.github.com/spec/v1
+oid sha256:a6177582b8d5a031910420394a9d05ae0c592bf42df68014731d35048eed2255
+size 354713007

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b26ef4475e8a6e5fff3fc6c76ca1a3fc84b7fff75734969f52c83055ce2ff5d
-size 355820242

 version https://git-lfs.github.com/spec/v1
+oid sha256:dba993ac31348a0b6dc7567776cb1850bb020a818db5d34013b3a237df6ce56e
+size 354713794

quantize_config.json CHANGED Viewed

@@ -1,100 +1,100 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Or",
                 "Pow",
-                "ConstantOfShape",
                 "Mul",
                 "Slice",
                 "Transpose",
-                "Erf",
                 "MatMul",
-                "Cast",
                 "Constant",
                 "ScatterND",
-                "Sub",
-                "Unsqueeze",
-                "Range",
-                "Add",
-                "Equal",
-                "Concat",
-                "ReduceMean",
-                "Where",
-                "Less",
-                "Div",
                 "Expand",
                 "Reshape",
-                "Not",
-                "Shape",
-                "Gather",
                 "Sqrt",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Or",
                 "Pow",
-                "ConstantOfShape",
                 "Mul",
                 "Slice",
                 "Transpose",
-                "Erf",
                 "MatMul",
-                "Cast",
                 "Constant",
                 "ScatterND",
-                "Sub",
-                "Unsqueeze",
-                "Range",
-                "Add",
-                "Equal",
-                "Concat",
-                "ReduceMean",
-                "Where",
-                "Less",
-                "Div",
                 "Expand",
                 "Reshape",
-                "Not",
-                "Shape",
                 "If",
-                "Gather",
                 "Sqrt",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
                 "Pow",
-                "ConstantOfShape",
                 "Mul",
                 "Slice",
                 "Transpose",
-                "Erf",
                 "MatMul",
-                "Cast",
                 "Constant",
-                "Sub",
-                "Unsqueeze",
-                "Add",
-                "Equal",
-                "Concat",
-                "ReduceMean",
-                "Where",
-                "Div",
-                "Reshape",
                 "Expand",
-                "Not",
-                "Shape",
-                "Gather",
                 "Sqrt",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": false,
+    "reduce_range": false,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Cast",
+                "Sub",
+                "Div",
+                "ReduceMean",
                 "Pow",
+                "Erf",
+                "Gather",
+                "Less",
+                "Add",
+                "Where",
+                "Equal",
                 "Mul",
+                "Or",
                 "Slice",
+                "Range",
+                "ConstantOfShape",
                 "Transpose",
                 "MatMul",
+                "Softmax",
+                "Not",
                 "Constant",
                 "ScatterND",
                 "Expand",
                 "Reshape",
                 "Sqrt",
+                "Unsqueeze",
+                "Concat",
+                "Shape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Cast",
+                "Sub",
+                "Div",
+                "ReduceMean",
                 "Pow",
+                "Erf",
+                "Gather",
+                "Less",
+                "Add",
+                "Where",
+                "Equal",
                 "Mul",
                 "Slice",
+                "Or",
+                "Range",
+                "ConstantOfShape",
                 "Transpose",
                 "MatMul",
+                "Softmax",
+                "Not",
                 "Constant",
                 "ScatterND",
                 "Expand",
                 "Reshape",
                 "If",
                 "Sqrt",
+                "Unsqueeze",
+                "Concat",
+                "Shape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Div",
+                "Cast",
+                "Sub",
                 "Pow",
+                "ReduceMean",
+                "Erf",
+                "Gather",
+                "Add",
+                "Where",
+                "Equal",
                 "Mul",
                 "Slice",
+                "ConstantOfShape",
                 "Transpose",
                 "MatMul",
+                "Softmax",
+                "Not",
                 "Constant",
                 "Expand",
+                "Reshape",
                 "Sqrt",
+                "Unsqueeze",
+                "Concat",
+                "Shape"
             ],
             "weight_type": "QInt8"
         }