Spaces:

neke-leo
/

phone-bot-demo

Runtime error

App Files Community

neke-leo committed on Sep 25, 2023

Commit

42b9715

•

1 Parent(s): 8407ed4

ENH: Add new version

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
.gitignore +0 -1
all_questions_audio.json +3 -0
app.py +95 -29
audio/0014ea63-6970-447d-9f37-d7ec600f2a18.mp3 +0 -0
audio/0040266e-5e79-41dd-943d-e8b414be79b9.mp3 +0 -0
audio/007de689-48fa-4ad4-924e-a32b5604a669.mp3 +0 -0
audio/00dd1484-fa96-4edd-b2c0-67a36e72814b.mp3 +0 -0
audio/014d0e79-346a-4184-aa0c-fde1d6cad727.mp3 +0 -0
audio/01679648-46e1-4b8d-bac4-a4efc1c03f4e.mp3 +0 -0
audio/01cb8d82-b08a-4a9e-b6fb-0d23d1b1d620.mp3 +0 -0
audio/0235968b-0e0e-427f-a053-d77b184d1217.mp3 +0 -0
audio/02869a46-696d-4545-8286-328b2bf9c38f.mp3 +0 -0
audio/03481c4a-b5bd-4cfd-b2a0-ed6e257e4612.mp3 +0 -0
audio/034e0813-b5a0-4b2b-ab22-beeda411b23b.mp3 +0 -0
audio/0387ccf5-bc33-4b3d-bca3-b7659b9d4541.mp3 +0 -0
audio/03c1a729-f086-4874-8543-8e319c8c0a38.mp3 +0 -0
audio/03dc1ece-261b-4368-b86b-144738bb9ed3.mp3 +0 -0
audio/0480beb7-4513-4d37-8745-c0b0916f2f11.mp3 +0 -0
audio/0552041a-5470-4a4e-b758-fcc96d5d5721.mp3 +0 -0
audio/060eb813-521d-4db8-8260-4d1f34b65694.mp3 +0 -0
audio/06497605-8980-411a-b885-ce688aa791eb.mp3 +0 -0
audio/064a1cd8-0317-4084-a7f4-cc62c501eb25.mp3 +0 -0
audio/066d87df-72a7-4637-8253-1290effb8d3a.mp3 +0 -0
audio/067bb319-ede8-4c58-990e-a14f4a76bfc7.mp3 +0 -0
audio/068bb98d-7be4-47bc-87f5-bfa56fc6414f.mp3 +0 -0
audio/06ecc371-3970-4350-8715-ac9bbf503c2f.mp3 +0 -0
audio/07042220-5613-427c-8d8b-4b4586e6cb1a.mp3 +0 -0
audio/074edb8e-3c8b-45f9-86fb-8b35bddfe92d.mp3 +0 -0
audio/0794c21d-b363-4dcc-974d-85ec010a6fe2.mp3 +0 -0
audio/07d14014-aa0a-4646-9a14-03c444e173c3.mp3 +0 -0
audio/07f8546c-cf3d-4893-b904-5afb3127dc77.mp3 +0 -0
audio/0841bbb2-da04-4fd3-acad-5348ec85c912.mp3 +0 -0
audio/088385df-9037-4047-bda7-ebc32886aed3.mp3 +0 -0
audio/08e4286a-e5a4-4de9-9221-dd777f685078.mp3 +0 -0
audio/08f5081b-7d12-47d7-bf12-d41e645a4ef6.mp3 +0 -0
audio/08f6c839-018a-4e7f-802c-29ac819ef0d1.mp3 +0 -0
audio/09ae3b98-7857-4505-aef6-445819aa4f92.mp3 +0 -0
audio/09b2d932-cba9-4192-b356-a2c27f964055.mp3 +0 -0
audio/0a047afb-a55f-4d3d-8082-513fec3507cf.mp3 +0 -0
audio/0a0fb2fd-ab1c-47a8-98c2-8af70f81c191.mp3 +0 -0
audio/0a3972f3-17b4-4207-97d7-2e4df35777a3.mp3 +0 -0
audio/0a68b75c-59b2-45a8-9fe1-2ebc8638685b.mp3 +0 -0
audio/0a92c22e-1167-444b-a8dd-e9a544bed022.mp3 +0 -0
audio/0a9e947f-8ae3-4eaf-b2cf-178e8f4d1f52.mp3 +0 -0
audio/0ad73ebb-db96-48d4-b428-36ee00b29ae8.mp3 +0 -0
audio/0aebd9f7-7cd3-4c3d-aef1-eaa05e54d6ee.mp3 +0 -0
audio/0b522ac8-4e0f-4dab-9f93-7571525ffb74.mp3 +0 -0
audio/0c1552e3-b333-47cc-bee7-5149c01c85e4.mp3 +0 -0
audio/0c2e0437-761c-4cdc-9874-ddbd7ffe03e0.mp3 +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+all_questions_audio.json filter=lfs diff=lfs merge=lfs -text

.gitignore CHANGED Viewed

@@ -1,6 +1,5 @@
 # ignore old_files folder
 old_files
-audio
 conversations
 # ignore pyc files
 *.pyc

 # ignore old_files folder
 old_files
 conversations
 # ignore pyc files
 *.pyc

all_questions_audio.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8413b2ff23d94e583c395e43760627b4252f6644be54df9b3c97b2523ae3f54f
+size 40038038

app.py CHANGED Viewed

@@ -3,8 +3,7 @@ import os
 import openai
-from audio_utils import text_to_speech, text_to_speech_polly
-from openai_prompts import contextualize_question
 from openai_utils import get_embedding, whisper_transcription
 from vector_db import LanceVectorDb, QnA
@@ -12,16 +11,14 @@ db = LanceVectorDb("qna_db")
 OPENAI_KEY = os.environ["OPENAI_KEY"]
 openai.api_key = OPENAI_KEY
-if len(db.table.to_pandas()) == 0:
     print("Empty db, trying to load qna's from json file")
     try:
-        db.init_from_qna_json("all_questions.json")
         print("Initialized db from json file")
     except Exception as exception:
         raise Exception("Failed to initialize db from json file") from exception
 import os
@@ -30,7 +27,7 @@ def ensure_dir(directory):
         os.makedirs(directory)
-ensure_dir("audio")
 import random
@@ -41,10 +38,10 @@ def red(text):
     return f'\x1b[31m"{text}"\x1b[0m'
-def query_database(prompt: str):
     print("Querying database for question:", prompt)
     embedding = get_embedding(prompt)
-    qnas = db.get_qna(embedding, lang="en", limit=3)
     print("Total_qnas:", len(qnas), [qna.score for qna in qnas])
     qnas = [qna for qna in qnas if qna.score < 0.49]
     print("Filtered_qnas:", len(qnas))
@@ -57,6 +54,7 @@ available_functions = {
 conversation_folder = f"conversations/{random.randint(0, 10000)}"
 ensure_dir(conversation_folder)
 SYSTEM_PROMPT = (
     "You are a question answering assistant.\n"
@@ -83,30 +81,43 @@ def bot_respond(user_query, history: list):
     chat_messages = history["chat_messages"]
-    user_query = contextualize_question(user_query, chat_messages)
-    path = os.path.join(conversation_folder, f"step_{step}_qna.json")
-    qnas = query_database(user_query)
-    prompt = f"The user said: ---{user_query}---\n\n"
     context = context_format(qnas)
     prompt += context
-    qna_messages = [
-        {
-            "role": "system",
-            "content": SYSTEM_PROMPT,
-        },
-        {
-            "role": "user",
-            "content": prompt,
-        },
-    ]
     completion = openai.ChatCompletion.create(
-        model="gpt-3.5-turbo", messages=qna_messages, temperature=0
     )
     response_message = completion["choices"][0]["message"]
@@ -114,6 +125,12 @@ def bot_respond(user_query, history: list):
     path = os.path.join(conversation_folder, f"step_{step}_qna.json")
     with open(path, "w") as f:
         json.dump(
             {
@@ -124,11 +141,28 @@ def bot_respond(user_query, history: list):
             indent=4,
         )
-    chat_messages.append({"role": "assistant", "content": bot_response})
     step += 1
-    return bot_response, prompt
 import random
@@ -143,11 +177,29 @@ def display_history(conversation):
     return conversation_string
 def handle_audiofile(audio_filepath: str, history: list):
     user_question = whisper_transcription(audio_filepath)
     print("Transcription", user_question)
-    bot_response_text, context_prompt = bot_respond(user_question, history)
     if bot_response_text:
         lang = detect(bot_response_text)
@@ -155,12 +207,20 @@ def handle_audiofile(audio_filepath: str, history: list):
     else:
         lang = "en"
     if lang not in ["en", "de"]:
         lang = "en"
-    output_filepath = os.path.join("audio", f"output_{random.randint(0, 1000)}.mp3")
     text_to_speech_polly(bot_response_text, lang, output_filepath)
     context_prompt += f"<<tts language>> : {lang}\n"
     context_prompt += f"<<tts text>> : {bot_response_text}\n"
@@ -171,6 +231,7 @@ def handle_audiofile(audio_filepath: str, history: list):
         context_prompt,
         display_history(history["chat_messages"]),
         output_filepath,
     )
@@ -198,6 +259,9 @@ with gr.Blocks() as demo:
         )
         conversation_history = gr.Textbox(label="Conversation history")
     # when the audio input is stopped, run the transcribe function
     audio_input.stop_recording(
         handle_audiofile,
@@ -209,9 +273,11 @@ with gr.Blocks() as demo:
             context_info,
             conversation_history,
             output_audio,
         ],
     )
 username = os.environ["GRADIO_USERNAME"]
 password = os.environ["GRADIO_PASSWORD"]

 import openai
+from audio_utils import text_to_speech_polly
 from openai_utils import get_embedding, whisper_transcription
 from vector_db import LanceVectorDb, QnA
 OPENAI_KEY = os.environ["OPENAI_KEY"]
 openai.api_key = OPENAI_KEY
+if not db.table or len(db.table.to_pandas()) == 0:
     print("Empty db, trying to load qna's from json file")
     try:
+        db.init_from_qna_json("all_questions_audio.json")
         print("Initialized db from json file")
     except Exception as exception:
         raise Exception("Failed to initialize db from json file") from exception
 import os
         os.makedirs(directory)
+ensure_dir("audio_temp")
 import random
     return f'\x1b[31m"{text}"\x1b[0m'
+def query_database(prompt: str, filters: dict = {}):
     print("Querying database for question:", prompt)
     embedding = get_embedding(prompt)
+    qnas = db.get_qna(embedding, filters=filters, limit=3)
     print("Total_qnas:", len(qnas), [qna.score for qna in qnas])
     qnas = [qna for qna in qnas if qna.score < 0.49]
     print("Filtered_qnas:", len(qnas))
 conversation_folder = f"conversations/{random.randint(0, 10000)}"
 ensure_dir(conversation_folder)
+print("Conversation", conversation_folder)
 SYSTEM_PROMPT = (
     "You are a question answering assistant.\n"
     chat_messages = history["chat_messages"]
+    qnas = query_database(user_query)
+    # Try to match an already existing question
+    if any(qna.score < 0.15 for qna in qnas):
+        min_score = min(qna.score for qna in qnas)
+        qna_minscore = [qna for qna in qnas if qna.score == min_score][0]
+        uid: str = qna_minscore.uid
+        mp3_path = os.path.join("audio", f"{uid}.mp3")
+        if not os.path.exists(mp3_path):
+            text_to_speech_polly(qna_minscore.answer, qna_minscore.language, mp3_path)
+        chat_messages.append({"role": "user", "content": user_query})
+        chat_messages.append({"role": "assistant", "content": qna_minscore.answer})
+        return {
+            "type": "cached_response",
+            "mp3_path": mp3_path,
+            "bot_response": qna_minscore.answer,
+            "prompt": "No chatbot response, cached response from database",
+        }
+    # Search only the base images
+    qnas = query_database(user_query, filters={"source": "base"})
+    # Use chatgpt to answer the question
+    path = os.path.join(conversation_folder, f"step_{step}_qna.json")
+    prompt = f"The user said: ---{user_query}---\n\n"
     context = context_format(qnas)
     prompt += context
+    chat_messages.append({"role": "user", "content": user_query})
     completion = openai.ChatCompletion.create(
+        model="gpt-4", messages=chat_messages, temperature=0
     )
     response_message = completion["choices"][0]["message"]
     path = os.path.join(conversation_folder, f"step_{step}_qna.json")
+    # remove the last message
+    chat_messages.pop(-1)
+    chat_messages.append({"role": "user", "content": user_query})
+    chat_messages.append({"role": "assistant", "content": bot_response})
     with open(path, "w") as f:
         json.dump(
             {
             indent=4,
         )
     step += 1
+    data = {
+        "type": "openai",
+        "bot_response": bot_response,
+        "prompt": prompt,
+    }
+    return data
+def add_question(question):
+    if os.path.exists("runtime_questions.json"):
+        with open("runtime_questions.json") as f:
+            questions = json.load(f)
+    else:
+        questions = []
+    questions.append(question)
+    with open("runtime_questions.json", "w") as f:
+        json.dump(questions, f, indent=4, ensure_ascii=False)
 import random
     return conversation_string
+if not os.path.exists("runtime_questions.json"):
+    with open("runtime_questions.json", "w") as f:
+        json.dump([], f)
 def handle_audiofile(audio_filepath: str, history: list):
     user_question = whisper_transcription(audio_filepath)
     print("Transcription", user_question)
+    res = bot_respond(user_question, history)
+    if res["type"] == "cached_response":
+        return (
+            user_question,
+            res["bot_response"],
+            history,
+            res["prompt"],
+            display_history(history["chat_messages"]),
+            res["mp3_path"],
+        )
+    else:
+        bot_response_text = res["bot_response"]
+        prompt = res["prompt"]
     if bot_response_text:
         lang = detect(bot_response_text)
     else:
         lang = "en"
+    add_question(
+        {"question": user_question, "answer": bot_response_text, "language": lang}
+    )
     if lang not in ["en", "de"]:
         lang = "en"
+    output_filepath = os.path.join(
+        "audio_temp", f"output_{random.randint(0, 1000)}.mp3"
+    )
     text_to_speech_polly(bot_response_text, lang, output_filepath)
+    context_prompt = prompt
     context_prompt += f"<<tts language>> : {lang}\n"
     context_prompt += f"<<tts text>> : {bot_response_text}\n"
         context_prompt,
         display_history(history["chat_messages"]),
         output_filepath,
+        "runtime_questions.json",
     )
         )
         conversation_history = gr.Textbox(label="Conversation history")
+    with gr.Row():
+        file_output = gr.File(label="Download questions file", download=True)
     # when the audio input is stopped, run the transcribe function
     audio_input.stop_recording(
         handle_audiofile,
             context_info,
             conversation_history,
             output_audio,
+            file_output,
         ],
     )
 username = os.environ["GRADIO_USERNAME"]
 password = os.environ["GRADIO_PASSWORD"]

audio/0014ea63-6970-447d-9f37-d7ec600f2a18.mp3 ADDED Viewed

Binary file (55.8 kB). View file

audio/0040266e-5e79-41dd-943d-e8b414be79b9.mp3 ADDED Viewed

Binary file (29.6 kB). View file

audio/007de689-48fa-4ad4-924e-a32b5604a669.mp3 ADDED Viewed

Binary file (88.2 kB). View file

audio/00dd1484-fa96-4edd-b2c0-67a36e72814b.mp3 ADDED Viewed

Binary file (22.7 kB). View file

audio/014d0e79-346a-4184-aa0c-fde1d6cad727.mp3 ADDED Viewed

Binary file (38.3 kB). View file

audio/01679648-46e1-4b8d-bac4-a4efc1c03f4e.mp3 ADDED Viewed

Binary file (47.1 kB). View file

audio/01cb8d82-b08a-4a9e-b6fb-0d23d1b1d620.mp3 ADDED Viewed

Binary file (65.9 kB). View file

audio/0235968b-0e0e-427f-a053-d77b184d1217.mp3 ADDED Viewed

Binary file (32.2 kB). View file

audio/02869a46-696d-4545-8286-328b2bf9c38f.mp3 ADDED Viewed

Binary file (44.1 kB). View file

audio/03481c4a-b5bd-4cfd-b2a0-ed6e257e4612.mp3 ADDED Viewed

Binary file (155 kB). View file

audio/034e0813-b5a0-4b2b-ab22-beeda411b23b.mp3 ADDED Viewed

Binary file (43.1 kB). View file

audio/0387ccf5-bc33-4b3d-bca3-b7659b9d4541.mp3 ADDED Viewed

Binary file (26.1 kB). View file

audio/03c1a729-f086-4874-8543-8e319c8c0a38.mp3 ADDED Viewed

Binary file (103 kB). View file

audio/03dc1ece-261b-4368-b86b-144738bb9ed3.mp3 ADDED Viewed

Binary file (26.8 kB). View file

audio/0480beb7-4513-4d37-8745-c0b0916f2f11.mp3 ADDED Viewed

Binary file (44 kB). View file

audio/0552041a-5470-4a4e-b758-fcc96d5d5721.mp3 ADDED Viewed

Binary file (145 kB). View file

audio/060eb813-521d-4db8-8260-4d1f34b65694.mp3 ADDED Viewed

Binary file (61.2 kB). View file

audio/06497605-8980-411a-b885-ce688aa791eb.mp3 ADDED Viewed

Binary file (39.8 kB). View file

audio/064a1cd8-0317-4084-a7f4-cc62c501eb25.mp3 ADDED Viewed

Binary file (80.8 kB). View file

audio/066d87df-72a7-4637-8253-1290effb8d3a.mp3 ADDED Viewed

Binary file (52.2 kB). View file

audio/067bb319-ede8-4c58-990e-a14f4a76bfc7.mp3 ADDED Viewed

Binary file (48.3 kB). View file

audio/068bb98d-7be4-47bc-87f5-bfa56fc6414f.mp3 ADDED Viewed

Binary file (28.4 kB). View file

audio/06ecc371-3970-4350-8715-ac9bbf503c2f.mp3 ADDED Viewed

Binary file (34.3 kB). View file

audio/07042220-5613-427c-8d8b-4b4586e6cb1a.mp3 ADDED Viewed

Binary file (78.1 kB). View file

audio/074edb8e-3c8b-45f9-86fb-8b35bddfe92d.mp3 ADDED Viewed

Binary file (31.7 kB). View file

audio/0794c21d-b363-4dcc-974d-85ec010a6fe2.mp3 ADDED Viewed

Binary file (30.3 kB). View file

audio/07d14014-aa0a-4646-9a14-03c444e173c3.mp3 ADDED Viewed

Binary file (32 kB). View file

audio/07f8546c-cf3d-4893-b904-5afb3127dc77.mp3 ADDED Viewed

Binary file (86.4 kB). View file

audio/0841bbb2-da04-4fd3-acad-5348ec85c912.mp3 ADDED Viewed

Binary file (22.9 kB). View file

audio/088385df-9037-4047-bda7-ebc32886aed3.mp3 ADDED Viewed

Binary file (29 kB). View file

audio/08e4286a-e5a4-4de9-9221-dd777f685078.mp3 ADDED Viewed

Binary file (37.1 kB). View file

audio/08f5081b-7d12-47d7-bf12-d41e645a4ef6.mp3 ADDED Viewed

Binary file (35 kB). View file

audio/08f6c839-018a-4e7f-802c-29ac819ef0d1.mp3 ADDED Viewed

Binary file (74.8 kB). View file

audio/09ae3b98-7857-4505-aef6-445819aa4f92.mp3 ADDED Viewed

Binary file (183 kB). View file

audio/09b2d932-cba9-4192-b356-a2c27f964055.mp3 ADDED Viewed

Binary file (46.7 kB). View file

audio/0a047afb-a55f-4d3d-8082-513fec3507cf.mp3 ADDED Viewed

Binary file (37.1 kB). View file

audio/0a0fb2fd-ab1c-47a8-98c2-8af70f81c191.mp3 ADDED Viewed

Binary file (131 kB). View file

audio/0a3972f3-17b4-4207-97d7-2e4df35777a3.mp3 ADDED Viewed

Binary file (44.4 kB). View file

audio/0a68b75c-59b2-45a8-9fe1-2ebc8638685b.mp3 ADDED Viewed

Binary file (77.9 kB). View file

audio/0a92c22e-1167-444b-a8dd-e9a544bed022.mp3 ADDED Viewed

Binary file (139 kB). View file

audio/0a9e947f-8ae3-4eaf-b2cf-178e8f4d1f52.mp3 ADDED Viewed

Binary file (67.3 kB). View file

audio/0ad73ebb-db96-48d4-b428-36ee00b29ae8.mp3 ADDED Viewed

Binary file (25.8 kB). View file

audio/0aebd9f7-7cd3-4c3d-aef1-eaa05e54d6ee.mp3 ADDED Viewed

Binary file (35.2 kB). View file

audio/0b522ac8-4e0f-4dab-9f93-7571525ffb74.mp3 ADDED Viewed

Binary file (91.9 kB). View file

audio/0c1552e3-b333-47cc-bee7-5149c01c85e4.mp3 ADDED Viewed

Binary file (222 kB). View file

audio/0c2e0437-761c-4cdc-9874-ddbd7ffe03e0.mp3 ADDED Viewed

Binary file (37.8 kB). View file