{ "added_tokens_decoder": { "0": { "content": "[PAD]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "100": { "content": "[UNK]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "101": { "content": "[CLS]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "102": { "content": "[SEP]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "103": { "content": "[MASK]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21128": { "content": "[Sasr]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21129": { "content": "[Pasr]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21130": { "content": "[Easr]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21131": { "content": "[Stts]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21132": { "content": "[Ptts]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21133": { "content": "[Etts]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21134": { "content": "[Sbreak]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21135": { "content": "[Pbreak]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21136": { "content": "[Ebreak]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21137": { "content": "[uv_break]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21138": { "content": "[v_break]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21139": { "content": "[lbreak]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21140": { "content": "[llbreak]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21141": { "content": "[undefine]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21142": { "content": "[laugh]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21143": { "content": "[spk_emb]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21144": { "content": "[empty_spk]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21145": { "content": "[music]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21146": { "content": "[pure]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21147": { "content": "[break_0]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21148": { "content": "[break_1]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21149": { "content": "[break_2]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21150": { "content": "[break_3]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21151": { "content": "[break_4]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21152": { "content": "[break_5]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21153": { "content": "[break_6]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21154": { "content": "[break_7]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21155": { "content": "[laugh_0]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21156": { "content": "[laugh_1]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21157": { "content": "[laugh_2]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21158": { "content": "[oral_0]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21159": { "content": "[oral_1]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21160": { "content": "[oral_2]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21161": { "content": "[oral_3]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21162": { "content": "[oral_4]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21163": { "content": "[oral_5]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21164": { "content": "[oral_6]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21165": { "content": "[oral_7]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21166": { "content": "[oral_8]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21167": { "content": "[oral_9]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21168": { "content": "[speed_0]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21169": { "content": "[speed_1]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21170": { "content": "[speed_2]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21171": { "content": "[speed_3]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21172": { "content": "[speed_4]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21173": { "content": "[speed_5]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21174": { "content": "[speed_6]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21175": { "content": "[speed_7]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21176": { "content": "[speed_8]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21177": { "content": "[speed_9]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "additional_special_tokens": [ "[Sasr]", "[Pasr]", "[Easr]", "[Stts]", "[Ptts]", "[Etts]", "[Sbreak]", "[Pbreak]", "[Ebreak]", "[uv_break]", "[v_break]", "[lbreak]", "[llbreak]", "[undefine]", "[laugh]", "[spk_emb]", "[empty_spk]", "[music]", "[pure]", "[break_0]", "[break_1]", "[break_2]", "[break_3]", "[break_4]", "[break_5]", "[break_6]", "[break_7]", "[laugh_0]", "[laugh_1]", "[laugh_2]", "[oral_0]", "[oral_1]", "[oral_2]", "[oral_3]", "[oral_4]", "[oral_5]", "[oral_6]", "[oral_7]", "[oral_8]", "[oral_9]", "[speed_0]", "[speed_1]", "[speed_2]", "[speed_3]", "[speed_4]", "[speed_5]", "[speed_6]", "[speed_7]", "[speed_8]", "[speed_9]" ], "clean_up_tokenization_spaces": true, "cls_token": "[CLS]", "do_basic_tokenize": true, "do_lower_case": true, "mask_token": "[MASK]", "max_length": 256, "model_max_length": 1000000000000000019884624838656, "never_split": null, "pad_to_multiple_of": null, "pad_token": "[PAD]", "pad_token_type_id": 0, "padding_side": "right", "sep_token": "[SEP]", "stride": 0, "strip_accents": null, "tokenize_chinese_chars": true, "tokenizer_class": "BertTokenizer", "truncation_side": "right", "truncation_strategy": "longest_first", "unk_token": "[UNK]" }