Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +62 -62
tokenizer.json +1 -0

config.json CHANGED Viewed

@@ -37,7 +37,7 @@
   "no_bias": true,
   "norm_type": "low_precision_layernorm",
   "resid_pdrop": 0.0,
-  "transformers_version": "4.32.1",
   "use_cache": false,
   "verbose": 0,
   "vocab_size": 50432

   "no_bias": true,
   "norm_type": "low_precision_layernorm",
   "resid_pdrop": 0.0,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": false,
   "verbose": 0,
   "vocab_size": 50432

generation_config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
   "_from_model_config": true,
-  "transformers_version": "4.32.1",
   "use_cache": false
 }

 {
   "_from_model_config": true,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": false
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e434ce50a6b81fd4b234c5d4b1d29bdd0c48e1dca27c435d3f76b5d0f6f030f
-size 1621899428

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ef3885afff8c3a3e0a7f10a662556410b3059f14faa89961e166e51ef63c4e2
+size 1415330022

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3d5e8f131d5aac51c90315ce723147eb7b7d875fb7d7c7fdd7eb98123ce13bb
-size 1622503619

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e16283f568a32bd8e9f8716e21a5af318e6ba5438b82d76a13265a4661494fc
+size 1415934308

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:620cfd14fb3e3618226e8468406c55a17b2a11ee417e47a18855d4fb264589f7
-size 408595992

 version https://git-lfs.github.com/spec/v1
+oid sha256:95fdbeec3fc8c6116c41b2153af4de72ca014a3466fa24b1edbf8904af9bae39
+size 356700610

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7a2ecfd618b43a6a816381bcb400696104217c1f541b8db7f891504337cd84c
-size 407714462

 version https://git-lfs.github.com/spec/v1
+oid sha256:54baba9918925344934e39d5ccc30d10bba3da938240fed4a09e072c6323549d
+size 355819455

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54d7dc2514a0deceb5f70fd54c8e6f4a2a8bc5e78030f3f501fdc72985a8fd00
-size 1621900820

 version https://git-lfs.github.com/spec/v1
+oid sha256:923d582c0e52660c047cae978a5288e45bab47ac4bd60829130ef68129d228d8
+size 1415331414

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c636d0f47f3a5fc2b99b2a8c613bcafc7fa4fb2790a87b198ea94daaf4ebe9da
-size 407715249

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b26ef4475e8a6e5fff3fc6c76ca1a3fc84b7fff75734969f52c83055ce2ff5d
+size 355820242

quantize_config.json CHANGED Viewed

@@ -2,99 +2,99 @@
     "per_channel": true,
     "reduce_range": true,
     "per_model_config": {
-        "decoder_model_merged": {
             "op_types": [
-                "Range",
-                "If",
-                "Concat",
-                "Equal",
-                "ReduceMean",
-                "Sub",
-                "Cast",
-                "Mul",
-                "Reshape",
                 "ConstantOfShape",
-                "MatMul",
                 "Erf",
-                "Gather",
-                "Unsqueeze",
-                "Expand",
-                "Not",
-                "Less",
                 "Constant",
-                "Slice",
                 "ScatterND",
                 "Div",
                 "Shape",
-                "Add",
-                "Pow",
-                "Softmax",
                 "Sqrt",
-                "Where",
-                "Or",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Range",
-                "Concat",
-                "Equal",
-                "ReduceMean",
-                "Sub",
-                "Cast",
-                "Mul",
-                "Reshape",
                 "ConstantOfShape",
-                "MatMul",
                 "Erf",
-                "Gather",
-                "Unsqueeze",
-                "Expand",
-                "Not",
-                "Less",
                 "Constant",
-                "Slice",
                 "ScatterND",
                 "Div",
                 "Shape",
-                "Add",
-                "Pow",
-                "Softmax",
                 "Sqrt",
-                "Where",
-                "Or",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Concat",
-                "Equal",
-                "ReduceMean",
-                "Sub",
-                "Cast",
-                "Mul",
-                "Reshape",
                 "ConstantOfShape",
-                "MatMul",
                 "Erf",
-                "Gather",
                 "Unsqueeze",
                 "Expand",
                 "Not",
-                "Constant",
-                "Slice",
-                "Div",
                 "Shape",
-                "Add",
-                "Pow",
-                "Softmax",
                 "Sqrt",
-                "Where",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         }

     "per_channel": true,
     "reduce_range": true,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
+                "Or",
+                "Pow",
                 "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Transpose",
                 "Erf",
+                "MatMul",
+                "Cast",
                 "Constant",
                 "ScatterND",
+                "Sub",
+                "Unsqueeze",
+                "Range",
+                "Add",
+                "Equal",
+                "Concat",
+                "ReduceMean",
+                "Where",
+                "Less",
                 "Div",
+                "Expand",
+                "Reshape",
+                "Not",
                 "Shape",
+                "Gather",
                 "Sqrt",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Or",
+                "Pow",
                 "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Transpose",
                 "Erf",
+                "MatMul",
+                "Cast",
                 "Constant",
                 "ScatterND",
+                "Sub",
+                "Unsqueeze",
+                "Range",
+                "Add",
+                "Equal",
+                "Concat",
+                "ReduceMean",
+                "Where",
+                "Less",
                 "Div",
+                "Expand",
+                "Reshape",
+                "Not",
                 "Shape",
+                "If",
+                "Gather",
                 "Sqrt",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Pow",
                 "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Transpose",
                 "Erf",
+                "MatMul",
+                "Cast",
+                "Constant",
+                "Sub",
                 "Unsqueeze",
+                "Add",
+                "Equal",
+                "Concat",
+                "ReduceMean",
+                "Where",
+                "Div",
+                "Reshape",
                 "Expand",
                 "Not",
                 "Shape",
+                "Gather",
                 "Sqrt",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

@@ -50,6 +50,7 @@
     "continuing_subword_prefix": null,
     "end_of_word_suffix": null,
     "fuse_unk": false,
     "vocab": {
       "<|endoftext|>": 0,
       "<|padding|>": 1,

     "continuing_subword_prefix": null,
     "end_of_word_suffix": null,
     "fuse_unk": false,
+    "byte_fallback": false,
     "vocab": {
       "<|endoftext|>": 0,
       "<|padding|>": 1,