yabramuvdi committed on
Commit
4e9c575
·
1 Parent(s): ed99087

add tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +1 -0
  2. tokenizer_config.json +1 -1
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"\n": 30522}
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "../models/distilbert_base_uncased/final/", "tokenizer_class": "DistilBertTokenizer"}
 
1
+ {"do_lower_case": true, "do_basic_tokenize": true, "never_split": null, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "tokenizer_file": "/home/yabra/.cache/huggingface/transformers/75abb59d7a06f4f640158a9bfcde005264e59e8d566781ab1415b139d2e4c603.7f2721073f19841be16f41b0a70b600ca6b880c8f3df6f3535cbc704371bdfa4", "name_or_path": "../models/final/", "padding": true, "tokenizer_class": "DistilBertTokenizer"}