Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +125 -0

config.json CHANGED Viewed

@@ -70,7 +70,7 @@
       "num_beams": 4
     }
   },
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 50264
 }

       "num_beams": 4
     }
   },
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 50264
 }

generation_config.json CHANGED Viewed

@@ -12,5 +12,5 @@
   "no_repeat_ngram_size": 3,
   "num_beams": 4,
   "pad_token_id": 1,
-  "transformers_version": "4.29.2"
 }

   "no_repeat_ngram_size": 3,
   "num_beams": 4,
   "pad_token_id": 1,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77ad751280773fe931bfd719c9f16d136b7a3b03bf8ab4f7500cb73cba380a65
-size 819558619

 version https://git-lfs.github.com/spec/v1
+oid sha256:a34147806885ea37601ae6d91a2598a93acc78db07a06e637f2f1e6ef9c90699
+size 819581461

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e7290c55a2b6b83daa9d24b812c114aca43191d079493afcc369eb7a6716c10
-size 819782600

 version https://git-lfs.github.com/spec/v1
+oid sha256:2c15a6f30dad41c3265f6786dbd850b6c563d9e6cca0197a1517822ccf2cb44b
+size 819827967

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d90579b6d28ad792b9940bdc15ba558d6ecc47f3c4226c6e4698f547e741f9bd
-size 206763801

 version https://git-lfs.github.com/spec/v1
+oid sha256:06a8b2aad1811a49576bb1fae43142bd91fc90204065a363191268ee84a7cd28
+size 206825235

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a9b99fec32f15ede8b22e1d389e2f98124dc4c38a016b7097cb8b736be99820
-size 206407053

 version https://git-lfs.github.com/spec/v1
+oid sha256:b704da825ee605a2576a88093fed2442978b00309d3a576337ae2fe1ac843fcf
+size 206437988

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c8197cf1d02b2e64f77fb70fbe4b15d6f1b654feb839cc0484103c41b9efb61
-size 769135510

 version https://git-lfs.github.com/spec/v1
+oid sha256:145e78c5a35e7bd92f57f58b17b9538c202ccd2e4b233b8f4deb2d91e3454a32
+size 769158110

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:beffad2e331c6b61ecbe52dd8c1015b5e266de3ec97dae286ad6cf9dc199f597
-size 193644092

 version https://git-lfs.github.com/spec/v1
+oid sha256:8615325c7835f7734c6c6ed53264dc85f9954db1f176697cf033fc596fc7f52c
+size 193674668

quantize_config.json ADDED Viewed

	@@ -0,0 +1,125 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Cast",
+                "Transpose",
+                "Slice",
+                "Concat",
+                "Unsqueeze",
+                "Where",
+                "Pow",
+                "Expand",
+                "MatMul",
+                "Sub",
+                "Div",
+                "Equal",
+                "Mul",
+                "Gather",
+                "Constant",
+                "Softmax",
+                "Shape",
+                "Squeeze",
+                "ConstantOfShape",
+                "Range",
+                "Less",
+                "Add",
+                "Sqrt",
+                "Reshape",
+                "ReduceMean",
+                "Erf"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Cast",
+                "If",
+                "Transpose",
+                "Slice",
+                "Concat",
+                "Unsqueeze",
+                "Where",
+                "Pow",
+                "Expand",
+                "MatMul",
+                "Sub",
+                "Div",
+                "Equal",
+                "Mul",
+                "Gather",
+                "Constant",
+                "Softmax",
+                "Shape",
+                "Squeeze",
+                "ConstantOfShape",
+                "Range",
+                "Less",
+                "Add",
+                "Sqrt",
+                "Reshape",
+                "ReduceMean",
+                "Erf"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Cast",
+                "Transpose",
+                "Concat",
+                "Unsqueeze",
+                "Where",
+                "Pow",
+                "Expand",
+                "MatMul",
+                "Sub",
+                "Div",
+                "Equal",
+                "Mul",
+                "Gather",
+                "Constant",
+                "Softmax",
+                "Shape",
+                "ConstantOfShape",
+                "Range",
+                "Add",
+                "Sqrt",
+                "Reshape",
+                "ReduceMean",
+                "Erf"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Cast",
+                "Transpose",
+                "Concat",
+                "Unsqueeze",
+                "Where",
+                "Pow",
+                "Expand",
+                "MatMul",
+                "Sub",
+                "Div",
+                "Equal",
+                "Mul",
+                "Gather",
+                "Constant",
+                "Softmax",
+                "Shape",
+                "ConstantOfShape",
+                "Range",
+                "Add",
+                "Sqrt",
+                "Reshape",
+                "ReduceMean",
+                "Erf"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}