use transformers.js converter

Browse files

Files changed (6) hide show

config.json +9 -9
onnx/model.onnx +2 -2
onnx/model_quantized.onnx +2 -2
quantize_config.json +31 -0
special_tokens_map.json +35 -5
tokenizer_config.json +51 -2

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "microsoft/xtremedistil-l6-h256-uncased",
   "architectures": [
     "BertForSequenceClassification"
   ],
@@ -24,16 +24,16 @@
   "initializer_range": 0.02,
   "intermediate_size": 1024,
   "label2id": {
-    "Society & Culture": 0,
-    "Science & Mathematics": 1,
-    "Health": 2,
-    "Education & Reference": 3,
-    "Computers & Internet": 4,
-    "Sports": 5,
     "Business & Finance": 6,
     "Entertainment & Music": 7,
     "Family & Relationships": 8,
-    "Politics & Government": 9
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
@@ -43,7 +43,7 @@
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
   "problem_type": "multi_label_classification",
-  "transformers_version": "4.20.1",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 30522

 {
+  "_name_or_path": "jonaskoenig/topic_classification_04",
   "architectures": [
     "BertForSequenceClassification"
   ],
   "initializer_range": 0.02,
   "intermediate_size": 1024,
   "label2id": {
     "Business & Finance": 6,
+    "Computers & Internet": 4,
+    "Education & Reference": 3,
     "Entertainment & Music": 7,
     "Family & Relationships": 8,
+    "Health": 2,
+    "Politics & Government": 9,
+    "Science & Mathematics": 1,
+    "Society & Culture": 0,
+    "Sports": 5
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
   "problem_type": "multi_label_classification",
+  "transformers_version": "4.36.1",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 30522

onnx/model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b16459e6e0f96cf71216ab3971284df38dbda1d5c56160b9a415ba4071d16e6
-size 51234517

 version https://git-lfs.github.com/spec/v1
+oid sha256:94e75119882aaaabebcd3abdf6ea9d3b84dac550a480bafe779e4feaf94cfa69
+size 51233961

onnx/model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5def0132b3eb0fa83de927fbe5ff4ed7372a0318e63d5af6a3507e755d70115e
-size 13215348

 version https://git-lfs.github.com/spec/v1
+oid sha256:db08136f6794c723d017b22237cba58a2185fabb09d48e1710613850bedf08bd
+size 13256259

quantize_config.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "model": {
+            "op_types": [
+                "Add",
+                "Gather",
+                "GlobalAveragePool",
+                "Tanh",
+                "MatMul",
+                "Reshape",
+                "Softmax",
+                "Slice",
+                "Reciprocal",
+                "Cast",
+                "Shape",
+                "Concat",
+                "Squeeze",
+                "Mul",
+                "Unsqueeze",
+                "Erf",
+                "Range",
+                "Transpose",
+                "Sqrt",
+                "Sub"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

special_tokens_map.json CHANGED Viewed

@@ -1,7 +1,37 @@
 {
-  "cls_token": "[CLS]",
-  "mask_token": "[MASK]",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "unk_token": "[UNK]"
 }

 {
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tokenizer_config.json CHANGED Viewed

@@ -1,15 +1,64 @@
 {
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": true,
   "mask_token": "[MASK]",
-  "name_or_path": "microsoft/xtremedistil-l6-h256-uncased",
   "never_split": null,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
-  "special_tokens_map_file": null,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
 }

 {
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": true,
   "mask_token": "[MASK]",
+  "max_length": 64,
+  "model_max_length": 1000000000000000019884624838656,
   "never_split": null,
+  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sep_token": "[SEP]",
+  "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "[UNK]"
 }