jukebox-5b-lyrics / tokenizer_config.json
ArthurZ's picture
ArthurZ HF staff
Update Tokenizer (#1)
eb38caf
raw
history blame
312 Bytes
{
"max_n_lyric_tokens": 512,
"n_genres": 5,
"tokenizer_class": "JukeboxTokenizer",
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"version": [
"v2",
"v2",
"v2"
]
}