Spaces:
Sleeping
Sleeping
Chananchida
committed on
Commit
•
7501763
1
Parent(s):
bf56fe9
Update app.py
Browse files
app.py
CHANGED
@@ -11,8 +11,6 @@ from transformers import AutoTokenizer, AutoModelForQuestionAnswering
|
|
11 |
from sentence_transformers import SentenceTransformer,util
|
12 |
from pythainlp import Tokenizer
|
13 |
import pickle
|
14 |
-
import evaluate
|
15 |
-
from sklearn.metrics.pairwise import cosine_similarity,euclidean_distances
|
16 |
import gradio as gr
|
17 |
|
18 |
print(torch.cuda.is_available())
|
@@ -148,14 +146,41 @@ class Chatbot:
|
|
148 |
question_vector = self.get_embeddings(message)
|
149 |
question_vector=self.prepare_sentences_vector([question_vector])
|
150 |
similar_questions, similar_contexts, distances,indices = self.faiss_search(question_vector)
|
151 |
-
Answer = self.model_pipeline(
|
152 |
-
|
153 |
-
|
154 |
-
|
155 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
156 |
"""#Gradio"""
|
157 |
-
|
158 |
-
|
159 |
-
|
160 |
-
|
161 |
-
|
|
|
|
|
|
|
|
|
|
11 |
from sentence_transformers import SentenceTransformer,util
|
12 |
from pythainlp import Tokenizer
|
13 |
import pickle
|
|
|
|
|
14 |
import gradio as gr
|
15 |
|
16 |
print(torch.cuda.is_available())
|
|
|
146 |
question_vector = self.get_embeddings(message)
|
147 |
question_vector=self.prepare_sentences_vector([question_vector])
|
148 |
similar_questions, similar_contexts, distances,indices = self.faiss_search(question_vector)
|
149 |
+
Answer = self.model_pipeline(message, similar_contexts)
|
150 |
+
start_index = similar_contexts.find(Answer)
|
151 |
+
end_index = start_index + len(Answer)
|
152 |
+
_time = time.time() - t
|
153 |
+
output = {
|
154 |
+
"user_question": message,
|
155 |
+
"answer": df['Answer'][indices[0][0]],
|
156 |
+
"totaltime": round(_time, 3),
|
157 |
+
"distance": round(distances[0][0], 4),
|
158 |
+
"highlight_start": start_index,
|
159 |
+
"highlight_end": end_index
|
160 |
+
}
|
161 |
+
return output
|
162 |
+
def highlight_text(text, start_index, end_index):
|
163 |
+
if start_index < 0:
|
164 |
+
start_index = 0
|
165 |
+
if end_index > len(text):
|
166 |
+
end_index = len(text)
|
167 |
+
highlighted_text = ""
|
168 |
+
for i, char in enumerate(text):
|
169 |
+
if i == start_index:
|
170 |
+
highlighted_text += "<mark>"
|
171 |
+
highlighted_text += char
|
172 |
+
if i == end_index - 1:
|
173 |
+
highlighted_text += "</mark>"
|
174 |
+
return highlighted_text
|
175 |
+
|
176 |
+
|
177 |
"""#Gradio"""
|
178 |
+
if __name__ == "__main__":
    # Build the chatbot once at startup; Gradio reuses it per request.
    bot = ChatbotModel()

    def chat_interface(question, history):
        """Answer one chat turn, wrapping the answer span in <mark> tags.

        NOTE(review): reaches into the private ``_chatbot`` attribute and
        relies on module-level ``model``/``tokenizer``/``embedding_model``/
        ``df``/``index`` globals — presumably defined earlier in app.py;
        confirm against the full file.
        """
        result = bot._chatbot.predict(model, tokenizer, embedding_model, df, question, index)
        return highlight_text(result["answer"], result["highlight_start"], result["highlight_end"])

    # EXAMPLE = ["หลิน ไห่เฟิง มีชื่อเรียกอีกชื่อว่าอะไร" , "ใครเป็นผู้ตั้งสภาเศรษฐกิจโลกขึ้นในปี พ.ศ. 2514 โดยทุกปีจะมีการประชุมที่ประเทศสวิตเซอร์แลนด์", "โปรดิวเซอร์ของอัลบั้มตลอดกาล ของวงคีรีบูนคือใคร", "สกุลเดิมของหม่อมครูนุ่ม นวรัตน ณ อยุธยา คืออะไร"]
    demo = gr.ChatInterface(fn=chat_interface, title="CE66-04_Thai Question Answering System by using Deep Learning")
    demo.launch()
|