Add `bos_token` and `eos_token` to the tokenizer config.

https://huggingface.co/meta-llama/Llama-3.2-1B/blob/main/tokenizer_config.json
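Update this tokenizer config to be consistent with the Llama 3.2 tokenizer config linked above, which defines explicit `bos_token` and `eos_token` entries.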

Files changed (1) hide show

tokenizer_config.json CHANGED Viewed

@@ -33,7 +33,9 @@
       "special": true
     }
   },
   "clean_up_tokenization_spaces": true,
   "model_max_length": 1000000000000000019884624838656,
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

       "special": true
     }
   },
+  "bos_token": "<|begin_of_text|>",
   "clean_up_tokenization_spaces": true,
+  "eos_token": "<|end_of_text|>",
   "model_max_length": 1000000000000000019884624838656,
   "tokenizer_class": "PreTrainedTokenizerFast"
 }