Spaces:

ANON-STUDIOS-254
/

SAUTI_V1

Sleeping

254 committed on Aug 14

Commit

2de1bff

•

1 Parent(s): d3df9be

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,8 @@
 import gradio as gr
 import whisper
 # Load the Whisper model
 model = whisper.load_model("base")
@@ -7,17 +10,25 @@ model = whisper.load_model("base")
 def transcribe(audio):
     # Transcribe the audio file
     result = model.transcribe(audio)
-    return result['text']
 # Create the Gradio interface
-# Removed the 'source' parameter and set type to 'upload' for file uploads.
 demo = gr.Interface(
     fn=transcribe,
-    inputs=gr.Audio(type="filepath"),
-    outputs="text",
     title="Audio Transcription App",
-    description="Upload an audio file or record your voice to transcribe it to text."
 )
 # Launch the app
-demo.launch()

 import gradio as gr
 import whisper
+from wordcloud import WordCloud
+import tempfile
+import os
 # Load the Whisper model
 model = whisper.load_model("base")
 def transcribe(audio):
     # Transcribe the audio file
     result = model.transcribe(audio)
+    text = result['text']
+    # Generate a word cloud
+    wordcloud = WordCloud(width=800, height=400, background_color='white').generate(text)
+    # Save the word cloud image to a temporary file
+    with tempfile.NamedTemporaryFile(delete=False, suffix='.png') as tmpfile:
+        wordcloud.to_file(tmpfile.name)
+        return text, tmpfile.name
 # Create the Gradio interface
 demo = gr.Interface(
     fn=transcribe,
+    inputs=gr.Audio(type="filepath"),  # Allow file uploads
+    outputs=["text", gr.Image(type="filepath")],  # Output both text and image
     title="Audio Transcription App",
+    description="Upload an audio file to transcribe it to text and view a word cloud of the text."
 )
 # Launch the app
+if __name__ == "__main__":
+    demo.launch()