Speech-ChatGPT-Speech

Runtime error

Yusin committed on Dec 11, 2022

Commit

9922164

1 Parent(s): 90e3812

Update app.py (#10)

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,9 +6,9 @@ default_lang = "en"
 # ChatGPT
 from pyChatGPT import ChatGPT
-#import whisper
-#whisper_model = whisper.load_model("small")
-whisper = gr.Blocks.load(name="spaces/sanchit-gandhi/whisper-large-v2")
 import os
 session_token = os.environ.get('SessionToken')
@@ -46,30 +46,6 @@ def chat_hf(audio, custom_token, language):
     return whisper_text, gpt_response, fp.name
 # whisper
-#def translate(audio):
-#    print("""
-#    —
-#    Sending audio to Whisper ...
-#    —
-#    """)
-#
-#    audio = whisper.load_audio(audio)
-#    audio = whisper.pad_or_trim(audio)
-#
-#    mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
-#
-#    _, probs = whisper_model.detect_language(mel)
-#
-#    transcript_options = whisper.DecodingOptions(task="transcribe", fp16 = False)
-#
-#    transcription = whisper.decode(whisper_model, mel, transcript_options)
-#
-#    print("language spoken: " + transcription.language)
-#    print("transcript: " + transcription.text)
-#    print("———————————————————————————————————————————")
-#
-#    return transcription.text
 def translate(audio):
     print("""
     —
@@ -77,9 +53,33 @@ def translate(audio):
     —
     """)
-    text_result = whisper(audio, None, "transcribe", fn_index=0)
-    print(text_result)
-    return text_result
 with gr.Blocks() as blocks:

 # ChatGPT
 from pyChatGPT import ChatGPT
+import whisper
+whisper_model = whisper.load_model("small")
+#whisper = gr.Blocks.load(name="spaces/sanchit-gandhi/whisper-large-v2")
 import os
 session_token = os.environ.get('SessionToken')
     return whisper_text, gpt_response, fp.name
 # whisper
 def translate(audio):
     print("""
     —
     —
     """)
+    audio = whisper.load_audio(audio)
+    audio = whisper.pad_or_trim(audio)
+    mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
+    _, probs = whisper_model.detect_language(mel)
+    transcript_options = whisper.DecodingOptions(task="transcribe", fp16 = False)
+    transcription = whisper.decode(whisper_model, mel, transcript_options)
+    print("language spoken: " + transcription.language)
+    print("transcript: " + transcription.text)
+    print("———————————————————————————————————————————")
+    return transcription.text
+#def translate(audio):
+#    print("""
+#    —
+#    Sending audio to Whisper ...
+#    —
+#    """)
+#
+#    text_result = whisper(audio, None, "transcribe", fn_index=0)
+#    print(text_result)
+#    return text_result
 with gr.Blocks() as blocks: