Spaces:

anzorq
/

w2v-bert-2.0-kbd

Paused

anzorq committed on May 16

Commit

bfb5ccb

•

1 Parent(s): 264443a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import gradio as gr
 import torch
 import torchaudio
@@ -6,6 +7,7 @@ from transformers import AutoModelForCTC, Wav2Vec2BertProcessor
 model = AutoModelForCTC.from_pretrained("anzorq/w2v-bert-2.0-kbd")
 processor = Wav2Vec2BertProcessor.from_pretrained("anzorq/w2v-bert-2.0-kbd")
 def transcribe_speech(audio):
     # Load the audio file
     waveform, sr = torchaudio.load(audio)
@@ -35,7 +37,6 @@ def transcribe_speech(audio):
     return pred_text
-# Define the Gradio interface
 interface = gr.Interface(
     fn=transcribe_speech,
     inputs=gr.Audio(sources="microphone", type="filepath"),
@@ -43,5 +44,4 @@ interface = gr.Interface(
     live=True,
 )
-# Launch the app
 interface.launch()

+import spaces
 import gradio as gr
 import torch
 import torchaudio
 model = AutoModelForCTC.from_pretrained("anzorq/w2v-bert-2.0-kbd")
 processor = Wav2Vec2BertProcessor.from_pretrained("anzorq/w2v-bert-2.0-kbd")
+@spaces.GPU
 def transcribe_speech(audio):
     # Load the audio file
     waveform, sr = torchaudio.load(audio)
     return pred_text
 interface = gr.Interface(
     fn=transcribe_speech,
     inputs=gr.Audio(sources="microphone", type="filepath"),
     live=True,
 )
 interface.launch()