MultiMed / test.py
not-lain's picture
fixed audio interface
be980dd
raw
history blame
823 Bytes
import dotenv
import base64
import os
import requests
import gradio as gr
import PIL
import numpy as np
from scipy.io.wavfile import write
import gradio_client as grc
# Load variables from a local .env file (if one exists) into the process
# environment before anything below reads it.
dotenv.load_dotenv()
# Shared Gradio client for the hosted "facebook/seamless_m4t" app. It is
# created once at import time and reused by process_image for every request.
client = grc.Client("facebook/seamless_m4t")
def process_image(audio):
    """Translate a recorded French utterance into English text.

    Despite its name, this callback processes audio: the samples are written
    to a temporary WAV file, which is sent to the remote ``/run`` endpoint of
    the module-level ``client`` for speech-to-text translation ("S2TT").

    Args:
        audio: ``(sample_rate, samples)`` tuple where ``samples`` is a NumPy
            array, or ``None`` when no audio was supplied.

    Returns:
        The translated text on success. On any failure (bad input, file
        write error, remote call error) the exception message is returned
        as text so the UI shows it instead of crashing.
    """
    # Local import keeps this block self-contained; the file's import header
    # does not bring in tempfile.
    import tempfile

    if audio is None:
        return "No audio provided."

    wav_path = None
    try:
        sample_rate, samples = audio

        # A unique temp file per call: a fixed name such as "1.wav" would be
        # overwritten when two requests run at the same time.
        with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
            wav_path = tmp.name

        # The samples are stored as 16-bit PCM.
        # NOTE(review): float input in [-1, 1] would be truncated to zeros by
        # this cast — confirm the UI always delivers integer samples.
        write(wav_path, sample_rate, samples.astype(np.int16))

        result = client.predict(
            "S2TT",
            "file",
            None,
            wav_path,
            "",
            "French",  # source language
            "English",  # target language
            api_name="/run",
        )
        # The second element of the response carries the translated text.
        return f"{result[1]}"
    except Exception as e:
        # UI boundary: surface the problem as text instead of raising.
        return f"{e}"
    finally:
        # Always remove the temporary recording, even when the call failed.
        if wav_path is not None and os.path.exists(wav_path):
            os.remove(wav_path)
# Minimal web UI: one audio input wired to process_image, one text output.
iface = gr.Interface(
    fn=process_image,
    inputs="audio",
    outputs="text",
)
# Start serving the interface as soon as the script is run.
iface.launch()