Merge branch 'main' of https://huggingface.co/qqhann/w2v_hf_jsut_xlsr53
Browse files
README.md
CHANGED
@@ -94,7 +94,7 @@ processor = Wav2Vec2Processor.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
|
|
94 |
model = Wav2Vec2ForCTC.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
|
95 |
model.to("cuda")
|
96 |
|
97 |
-
chars_to_ignore_regex = '[
|
98 |
# resampler = torchaudio.transforms.Resample(48_000, 16_000) # JSUT is already 16kHz
|
99 |
resampler = torchaudio.transforms.Resample(16_000, 16_000) # JSUT is already 16kHz
|
100 |
|
|
|
94 |
model = Wav2Vec2ForCTC.from_pretrained("qqhann/w2v_hf_jsut_xlsr53")
|
95 |
model.to("cuda")
|
96 |
|
97 |
+
chars_to_ignore_regex = '[\\,\\?\\.\\!\\-\\;\\:\\"\\“]' # TODO: adapt this list to include all special characters you removed from the data
|
98 |
# resampler = torchaudio.transforms.Resample(48_000, 16_000) # JSUT is already 16kHz
|
99 |
resampler = torchaudio.transforms.Resample(16_000, 16_000) # JSUT is already 16kHz
|
100 |
|