Upload folder using huggingface_hub

Browse files

Files changed (9)

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +88 -0

config.json CHANGED Viewed

@@ -47,7 +47,7 @@
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 50257,
   "window_size": 256

   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 50257,
   "window_size": 256

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.29.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f4a8d366b57be68c4f69c93d710b360a4922f89793b25755fe897b87ccb014f
-size 663869637

 version https://git-lfs.github.com/spec/v1
+oid sha256:00871334ff4eb7926f4b07f0231858255b0fcb79402e94a4143200fd828f3dbf
+size 509478592

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1f20e7a37ade821c43dc654410d91fba293eac2d0cfae22c2ffff81b8a52b4f
-size 664174866

 version https://git-lfs.github.com/spec/v1
+oid sha256:a93d4be13c01d658f7098461e96c67e896397c79fbbad2f512f2ad7ffdb65122
+size 518170806

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a69449f0ac812d1fa23ef46ddad943b3b770090eb00d77215de22b08e886937
-size 174103215

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3934849b8b8f2c03bede375252f6d0a1f04b9e9464778ce85748011f0f1bf4b
+size 143637537

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2381edc2bbc024d9c696b2e6a78e4317fad3f76a5d738f647c5c49b0476776a1
-size 173613657

 version https://git-lfs.github.com/spec/v1
+oid sha256:769c3908bb29c78de8207d1c22c10928af1077cbcac079e61011bb3560a80c25
+size 134762187

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:748f1d9481b698f02fb103ced086020882933b3a4739b353107cb286752d8cba
-size 663877400

 version https://git-lfs.github.com/spec/v1
+oid sha256:85bc2f7c57461729ee6e2a3e87e25a4d24fe9543126a9fbf8b0380a76c6987ac
+size 509486355

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6fba5ff99a179478524373933eab362af2ac74f782ea2719727967493a50021e
-size 173623241

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9d92306ccac644e25de041d14d1dee037cee58609d105a44c45150a404dbe40
+size 134771771

quantize_config.json ADDED Viewed

@@ -0,0 +1,88 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Squeeze",
+                "Softmax",
+                "Add",
+                "Reshape",
+                "Pow",
+                "Concat",
+                "Slice",
+                "Mul",
+                "Gather",
+                "Unsqueeze",
+                "ReduceMean",
+                "Sub",
+                "Cast",
+                "Tanh",
+                "Shape",
+                "Constant",
+                "Range",
+                "MatMul",
+                "Div",
+                "Sqrt",
+                "Where",
+                "Transpose"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Squeeze",
+                "Softmax",
+                "Add",
+                "Reshape",
+                "Pow",
+                "Concat",
+                "Slice",
+                "Mul",
+                "Gather",
+                "Unsqueeze",
+                "ReduceMean",
+                "Sub",
+                "Cast",
+                "Tanh",
+                "Shape",
+                "Transpose",
+                "Range",
+                "If",
+                "MatMul",
+                "Div",
+                "Sqrt",
+                "Where",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Squeeze",
+                "Softmax",
+                "Add",
+                "Reshape",
+                "Pow",
+                "Concat",
+                "Slice",
+                "Mul",
+                "Gather",
+                "Unsqueeze",
+                "ReduceMean",
+                "Sub",
+                "Cast",
+                "Tanh",
+                "Shape",
+                "Constant",
+                "Range",
+                "MatMul",
+                "Div",
+                "Sqrt",
+                "Where",
+                "Transpose"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}