RichardErkhov
/

nicholasKluge_-_Aira-2-portuguese-124M-4bits

Text Generation

text-generation-inference

Inference Endpoints

4-bit precision

Model card Files and versions Community

RichardErkhov committed on Jul 20

Commit

c52105e

•

1 Parent(s): 36a8e2c

uploaded model

Files changed (1) hide show

tokenizer_config.json +56 -0

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "50257": {
+      "content": "<|startofinstruction|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "50258": {
+      "content": "<|endofcompletion|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "50259": {
+      "content": "<|endofinstruction|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "50260": {
+      "content": "<|pad|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|startofinstruction|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endofcompletion|>",
+  "errors": "replace",
+  "full_tokenizer_file": null,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<|pad|>",
+  "sep_token": "<|endofinstruction|>",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}