qqpann
/

w2v_hf_jsut_xlsr53

@@ -94,7 +94,7 @@ processor = Wav2Vec2Processor.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
 model = Wav2Vec2ForCTC.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
 model.to("cuda")
-chars_to_ignore_regex = '[\,\?\.\!\-\;\:\"\“]'  # TODO: adapt this list to include all special characters you removed from the data
 # resampler = torchaudio.transforms.Resample(48_000, 16_000) # JSUT is already 16kHz
 resampler = torchaudio.transforms.Resample(16_000, 16_000) # JSUT is already 16kHz

 model = Wav2Vec2ForCTC.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
 model.to("cuda")
+chars_to_ignore_regex = '[\\\\,\\\\?\\\\.\\\\!\\\\-\\\\;\\\\:\\\\"\\\\“]'  # TODO: adapt this list to include all special characters you removed from the data
 # resampler = torchaudio.transforms.Resample(48_000, 16_000) # JSUT is already 16kHz
 resampler = torchaudio.transforms.Resample(16_000, 16_000) # JSUT is already 16kHz