File size: 585 Bytes
230fca6
8c24f20
230fca6
22ee534
230fca6
 
 
ca46f4b
 
b7d8cb4
22ee534
 
230fca6
 
22ee534
ca46f4b
230fca6
 
 
 
 
22ee534
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
import os
import tempfile

import gradio as gr
import requests
from moviepy.editor import *
from transformers import pipeline

# Hugging Face Hub id of the fine-tuned Whisper checkpoint served by this demo.
# Replace with "your-username/the-name-you-picked" to serve your own model.
MODEL_ID = "kk90ujhun/whisper-small-hi"

# Loaded once at import time so every request reuses the same pipeline object.
pipe = pipeline(model=MODEL_ID)

def transcribe(my_video):
    """Transcribe the speech contained in an uploaded video.

    Gradio's ``Video`` input hands the callback a filesystem path to the
    uploaded file (or ``None`` when nothing was uploaded), not a moviepy
    clip. The audio track is therefore extracted to a temporary WAV file
    with moviepy, and that file's path is given to the speech-recognition
    pipeline.

    Args:
        my_video: Path to the video file, or ``None``/empty when no video
            was provided.

    Returns:
        The transcribed text, or an empty string when there is no video or
        the video has no audio track.
    """
    # Nothing uploaded: return an empty transcript instead of crashing.
    if not my_video:
        return ""

    # The temporary directory (and the WAV inside it) is removed on exit,
    # so repeated requests do not accumulate files on disk.
    with tempfile.TemporaryDirectory() as tmp_dir:
        wav_path = os.path.join(tmp_dir, "audio.wav")

        # Close the clip as soon as the audio is written to release the
        # underlying ffmpeg reader processes.
        with VideoFileClip(my_video) as clip:
            if clip.audio is None:
                # Silent video: there is nothing to transcribe.
                return ""
            # logger=None suppresses moviepy's progress bar in server logs.
            clip.audio.write_audiofile(wav_path, logger=None)

        return pipe(wav_path)["text"]

# Build the web UI: one video upload in, the transcript text out.
iface = gr.Interface(
    fn=transcribe,
    # The component class is ``gr.Video``; lowercase ``gr.video`` does not
    # exist and raises AttributeError before the app can start.
    inputs=gr.Video(),
    outputs="text",
    title="Whisper Small Hindi",
    description="Realtime demo for Hindi speech recognition using a fine-tuned Whisper small model.",
)

# Start the Gradio server (blocks until the app is stopped).
iface.launch()