Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +57 -57

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:55fbbfbdd774d0f4cc2a92f59f11e58584539d3a92dfb6536f65d4d3c1c4f57a
 size 791453859

 version https://git-lfs.github.com/spec/v1
+oid sha256:85b04628082c655fe5a8cfee14893b0f03cc3e662d5352320aa401fe75aafc15
 size 791453859

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4699d4bb1950bb65f77e2f6ce1b26a51f26fdb5813e22581efcf0c40fd8b95b4
-size 300505575

 version https://git-lfs.github.com/spec/v1
+oid sha256:5675c823efffcc4da240db6f8ebcd0d5c5effa2038dcb52cade133b6d93227cd
+size 299954775

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a960ff52fcdff888c99beb87c7a497165a3e2201b3c24777ce295b37c546062
-size 232856903

 version https://git-lfs.github.com/spec/v1
+oid sha256:6889a8fdc9daf18b7aa3c6124684eaffd0fb2fba6ee0103064ad719d79d7bf0a
+size 232306103

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c964f2c88afb32affe47ab3d531c48617ebe071b393ad5eec09c1e410948b4bf
-size 232865860

 version https://git-lfs.github.com/spec/v1
+oid sha256:66061e6a38529a523db921f29bebea1086e4753e60daff773ecfe8fb48ad0b10
+size 232315060

quantize_config.json CHANGED Viewed

@@ -1,98 +1,98 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Transpose",
-                "ReduceMean",
                 "Div",
-                "Gather",
                 "And",
                 "Add",
-                "Constant",
-                "Mul",
                 "Concat",
-                "Sub",
-                "Split",
-                "Pow",
-                "Tanh",
-                "ConstantOfShape",
-                "Softmax",
                 "Cast",
-                "Sqrt",
-                "Equal",
-                "Squeeze",
-                "Shape",
                 "MatMul",
                 "Where",
                 "Reshape",
-                "Unsqueeze",
-                "Slice",
-                "CumSum"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Transpose",
-                "ReduceMean",
                 "Div",
-                "Gather",
                 "And",
                 "Add",
-                "Constant",
-                "Mul",
                 "Concat",
-                "If",
-                "Sub",
-                "Split",
-                "Pow",
-                "Tanh",
-                "ConstantOfShape",
-                "Softmax",
                 "Cast",
-                "Sqrt",
-                "Equal",
-                "Squeeze",
-                "Shape",
                 "MatMul",
                 "Where",
                 "Reshape",
-                "Unsqueeze",
-                "Slice",
-                "CumSum"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Transpose",
-                "ReduceMean",
                 "Div",
-                "Gather",
                 "And",
                 "Add",
-                "Constant",
-                "Mul",
                 "Concat",
-                "Sub",
-                "Split",
-                "Pow",
-                "Tanh",
-                "ConstantOfShape",
-                "Softmax",
                 "Cast",
-                "Sqrt",
-                "Equal",
-                "Squeeze",
-                "Shape",
                 "MatMul",
                 "Where",
                 "Reshape",
-                "Unsqueeze",
-                "Slice",
-                "CumSum"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": false,
+    "reduce_range": false,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Equal",
+                "Mul",
                 "Div",
+                "Pow",
                 "And",
+                "Sub",
+                "Shape",
+                "CumSum",
+                "Transpose",
                 "Add",
+                "Slice",
                 "Concat",
                 "Cast",
+                "ReduceMean",
                 "MatMul",
                 "Where",
+                "Squeeze",
                 "Reshape",
+                "Constant",
+                "ConstantOfShape",
+                "Sqrt",
+                "Split",
+                "Gather"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Equal",
+                "Mul",
                 "Div",
+                "Pow",
                 "And",
+                "Sub",
+                "Shape",
+                "CumSum",
+                "Transpose",
                 "Add",
+                "Slice",
                 "Concat",
                 "Cast",
+                "ReduceMean",
                 "MatMul",
                 "Where",
+                "Squeeze",
                 "Reshape",
+                "Constant",
+                "ConstantOfShape",
+                "Sqrt",
+                "If",
+                "Split",
+                "Gather"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Equal",
+                "Mul",
                 "Div",
+                "Pow",
                 "And",
+                "Sub",
+                "Shape",
+                "CumSum",
+                "Transpose",
                 "Add",
+                "Slice",
                 "Concat",
                 "Cast",
+                "ReduceMean",
                 "MatMul",
                 "Where",
+                "Squeeze",
                 "Reshape",
+                "Constant",
+                "ConstantOfShape",
+                "Sqrt",
+                "Split",
+                "Gather"
             ],
             "weight_type": "QInt8"
         }