File size: 509 Bytes
8250eed
 
08d8d00
 
 
 
bfe22ad
 
 
 
1
2
3
4
5
6
7
8
9
10
from transformers import PreTrainedTokenizerFast

class ModernDecoderBERTTokenizer(PreTrainedTokenizerFast):
    """Fast tokenizer whose special-token assembly only removes EOS ids.

    Construction is forwarded unchanged to ``PreTrainedTokenizerFast``; the
    only customised behaviour is ``build_inputs_with_special_tokens``.
    """

    def __init__(self, *args, **kwargs):
        # No additional state: hand every argument to the parent constructor.
        super().__init__(*args, **kwargs)

    def build_inputs_with_special_tokens(self, token_ids_0, token_ids_1=None):
        """Return the given ids with every EOS id filtered out.

        Args:
            token_ids_0: Ids of the first sequence.
            token_ids_1: Optional ids of a second sequence. When provided,
                its filtered ids are appended after those of ``token_ids_0``.

        Returns:
            A new list holding, in order, every id that is not equal to
            ``self.eos_token_id``. No other ids are inserted.
        """

        def without_eos(sequence):
            # Keep the original ordering; drop only ids equal to the EOS id.
            kept = []
            for token in sequence:
                if token != self.eos_token_id:
                    kept.append(token)
            return kept

        first = without_eos(token_ids_0)
        if token_ids_1 is not None:
            return first + without_eos(token_ids_1)
        return first