othrif
/

wav2vec_test

Automatic Speech Recognition

Inference Endpoints

Model card Files Files and versions Community

othrif committed on Mar 29, 2021

Commit

7f73f6c

•

1 Parent(s): ca734d4

Update README.md

Files changed (1) hide show

README.md +4 -5

README.md CHANGED Viewed

@@ -6,7 +6,6 @@ tags:
 - audio
 - automatic-speech-recognition
 - speech
-- xlsr-fine-tuning-week
 license: apache-2.0
 model-index:
 - name: XLSR Wav2Vec2 Egyptian by Zaid Alyafeai and Othmane Rifki
@@ -40,13 +39,13 @@ resampler = torchaudio.transforms.Resample(48_000, 16_000)
 # Preprocessing the datasets.
 # We need to read the audio files as arrays
 def speech_file_to_array_fn(batch):
-\tspeech_array, sampling_rate = torchaudio.load(batch["path"])
-\tbatch["speech"] = resampler(speech_array).squeeze().numpy()
-\treturn batch
 test_dataset = test_dataset.map(speech_file_to_array_fn)
 inputs = processor(test_dataset["speech"][:2], sampling_rate=16_000, return_tensors="pt", padding=True)
 with torch.no_grad():
-\tlogits = model(inputs.input_values, attention_mask=inputs.attention_mask).logits
 predicted_ids = torch.argmax(logits, dim=-1)
 print("Prediction:", processor.batch_decode(predicted_ids))
 print("Reference:", test_dataset["sentence"][:2])

 - audio
 - automatic-speech-recognition
 - speech
 license: apache-2.0
 model-index:
 - name: XLSR Wav2Vec2 Egyptian by Zaid Alyafeai and Othmane Rifki
 # Preprocessing the datasets.
 # We need to read the audio files as arrays
 def speech_file_to_array_fn(batch):
+\\tspeech_array, sampling_rate = torchaudio.load(batch["path"])
+\\tbatch["speech"] = resampler(speech_array).squeeze().numpy()
+\\treturn batch
 test_dataset = test_dataset.map(speech_file_to_array_fn)
 inputs = processor(test_dataset["speech"][:2], sampling_rate=16_000, return_tensors="pt", padding=True)
 with torch.no_grad():
+\\tlogits = model(inputs.input_values, attention_mask=inputs.attention_mask).logits
 predicted_ids = torch.argmax(logits, dim=-1)
 print("Prediction:", processor.batch_decode(predicted_ids))
 print("Reference:", test_dataset["sentence"][:2])