{
  "version": "1.0",
  "truncation": {
    "direction": "Right",
    "max_length": 2048,
    "strategy": "LongestFirst",
    "stride": 0
  },
  "padding": null,
  "added_tokens": [
    {
      "id": 0,
      "content": "[UNK]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 1,
      "content": "[BOS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 2,
      "content": "[EOS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 3,
      "content": "[PAD]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    }
  ],
  "normalizer": null,
  "pre_tokenizer": {
    "type": "Whitespace"
  },
  "post_processor": {
    "type": "TemplateProcessing",
    "single": [
      {
        "SpecialToken": {
          "id": "[BOS]",
          "type_id": 0
        }
      },
      {
        "Sequence": {
          "id": "A",
          "type_id": 0
        }
      },
      {
        "SpecialToken": {
          "id": "[EOS]",
          "type_id": 0
        }
      }
    ],
    "pair": [
      {
        "Sequence": {
          "id": "A",
          "type_id": 0
        }
      },
      {
        "Sequence": {
          "id": "B",
          "type_id": 1
        }
      }
    ],
    "special_tokens": {
      "[BOS]": {
        "id": "[BOS]",
        "ids": [
          1
        ],
        "tokens": [
          "[BOS]"
        ]
      },
      "[EOS]": {
        "id": "[EOS]",
        "ids": [
          2
        ],
        "tokens": [
          "[EOS]"
        ]
      }
    }
  },
  "decoder": null,
  "model": {
    "type": "BPE",
    "dropout": null,
    "unk_token": "[UNK]",
    "continuing_subword_prefix": null,
    "end_of_word_suffix": null,
    "fuse_unk": false,
    "byte_fallback": false,
    "vocab": {
      "[UNK]": 0,
      "[BOS]": 1,
      "[EOS]": 2,
      "[PAD]": 3,
      "0": 4,
      "1": 5,
      "2": 6,
      "3": 7,
      "4": 8,
      "5": 9,
      "6": 10,
      "7": 11,
      "8": 12,
      "9": 13,
      "43": 14,
      "32": 15,
      "25": 16,
      "33": 17,
      "23": 18,
      "20": 19,
      "30": 20,
      "14": 21,
      "39": 22,
      "13": 23,
      "27": 24,
      "22": 25,
      "29": 26,
      "15": 27,
      "38": 28,
      "16": 29,
      "49": 30,
      "48": 31,
      "17": 32,
      "34": 33,
      "47": 34,
      "42": 35,
      "12": 36,
      "45": 37,
      "46": 38,
      "37": 39,
      "35": 40,
      "18": 41,
      "41": 42,
      "40": 43,
      "44": 44,
      "28": 45,
      "36": 46,
      "24": 47,
      "21": 48,
      "26": 49,
      "11": 50,
      "19": 51,
      "10": 52,
      "31": 53
    },
    "merges": [
      "4 3",
      "3 2",
      "2 5",
      "3 3",
      "2 3",
      "2 0",
      "3 0",
      "1 4",
      "3 9",
      "1 3",
      "2 7",
      "2 2",
      "2 9",
      "1 5",
      "3 8",
      "1 6",
      "4 9",
      "4 8",
      "1 7",
      "3 4",
      "4 7",
      "4 2",
      "1 2",
      "4 5",
      "4 6",
      "3 7",
      "3 5",
      "1 8",
      "4 1",
      "4 0",
      "4 4",
      "2 8",
      "3 6",
      "2 4",
      "2 1",
      "2 6",
      "1 1",
      "1 9",
      "1 0",
      "3 1"
    ]
  }
}