Spaces:

DSatishchandra
/

Voicebot

Runtime error

App Files Files Community

DSatishchandra committed on Dec 18, 2024

Commit

49e2d43

verified ·

1 Parent(s): c218b1a

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -6

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import gradio as gr
 import speech_recognition as sr
 from gtts import gTTS
 import os
-from playsound import playsound  # Import playsound library
 from transformers import pipeline
 # Initialize recognizer for speech recognition
@@ -26,11 +26,19 @@ def process_order(order):
     else:
         return "Sorry, we didn't catch that. Please try again."
-# Function to handle speech recognition
 def recognize_speech(audio):
     try:
-        # Recognize speech using SpeechRecognition
-        text = recognizer.recognize_google(audio)
         response = process_order(text)
         # Using gTTS to respond back with speech
@@ -42,6 +50,7 @@ def recognize_speech(audio):
         return response
     except Exception as e:
         return "Sorry, I could not understand."
 # Gradio Interface for the app
@@ -49,8 +58,8 @@ def create_gradio_interface():
     with gr.Blocks() as demo:
         gr.Markdown("## AI Voice Bot for Food Ordering")
-        # Audio Input: User speaks into microphone
-        audio_input = gr.Audio(type="numpy", label="Speak to the bot")
         # Display the bot's response after recognition
         output_text = gr.Textbox(label="Bot Response")

 import speech_recognition as sr
 from gtts import gTTS
 import os
+from playsound import playsound
 from transformers import pipeline
 # Initialize recognizer for speech recognition
     else:
         return "Sorry, we didn't catch that. Please try again."
+# Function to handle speech recognition from audio files or microphone
 def recognize_speech(audio):
     try:
+        # If audio is from file, use SpeechRecognition to convert speech to text
+        if isinstance(audio, str):  # Audio file input
+            with sr.AudioFile(audio) as source:
+                audio_data = recognizer.record(source)
+                text = recognizer.recognize_google(audio_data)
+        else:  # Audio from microphone input
+            text = recognizer.recognize_google(audio)
+        print(f"Recognized text: {text}")  # Print the recognized text for debugging
         response = process_order(text)
         # Using gTTS to respond back with speech
         return response
     except Exception as e:
+        print(f"Error: {e}")  # Print the error for debugging
         return "Sorry, I could not understand."
 # Gradio Interface for the app
     with gr.Blocks() as demo:
         gr.Markdown("## AI Voice Bot for Food Ordering")
+        # Audio Input: User speaks into microphone or uploads a file
+        audio_input = gr.Audio(type="file", label="Speak to the bot (Upload or Record Audio)")
         # Display the bot's response after recognition
         output_text = gr.Textbox(label="Bot Response")