Spaces:
Running
Running
import os | |
import chromadb | |
import gradio as gr | |
from openai import AzureOpenAI | |
from langchain_huggingface import HuggingFaceEmbeddings | |
from langchain_community.vectorstores import Chroma | |
from typing import List | |
qna_system_message = """ | |
You are an assistant to an insurance firm who answers customer queries based on their insurance policy documents. | |
User input will have the context required by you to answer customer questions. | |
This context will begin with the word: ###Context. | |
The context contains references to specific portions of a document relevant to the customer query. | |
Customer questions will begin with the word: ###Question. | |
Information about the customer will begin with the word: ###Customer Information | |
Please answer user questions ONLY using the context provided in the input and the customer information. | |
DO NOT mention anything about the context in your final answer. | |
Your response should only contain the answer to the question AND NOTHING ELSE. | |
If the answer is not found in the context, respond "Sorry, I cannot answer your question at this point. Please contact our hotline: 1-800-INSURANCE". | |
""" | |
qna_user_message_template = """ | |
###Customer Information | |
Customer Name: John Doe | |
Username: johndoe | |
Policy Number: NBHTGBP22011V012223# | |
Bank Account Number: 424242424242 | |
Premium Amount: $15000 | |
Number of premium installments: 5 | |
Number of installments paid: 3 | |
Last Premium Paid: Yes | |
Last Premium Date: 2024-05-12 | |
###Context | |
Here are some documents that are relevant to the question mentioned below. | |
{context} | |
###Question | |
{question} | |
""" | |
client = AzureOpenAI( | |
api_key=os.environ["AZURE_OPENAI_KEY"], | |
azure_endpoint=os.environ["AZURE_OPENAI_ENDPOINT"], | |
api_version="2024-02-01" | |
) | |
embedding_model = HuggingFaceEmbeddings(model_name='thenlper/gte-large') | |
qna_model = 'gpt-4o-mini' | |
chromadb_client = chromadb.PersistentClient(path='./health_policy_db') | |
vectorstore_persisted = Chroma( | |
client=chromadb_client, | |
collection_name="policy-text", | |
embedding_function=embedding_model | |
) | |
retriever = vectorstore_persisted.as_retriever( | |
search_type='similarity', | |
search_kwargs={'k': 5} | |
) | |
def predict(input: str, history): | |
""" | |
Predict the response of the chatbot and complete a running list of chat history. | |
""" | |
relevant_document_chunks = retriever.invoke(input) | |
context_list = [d.page_content for d in relevant_document_chunks] | |
context_for_query = "\n".join(context_list) | |
user_message = [{ | |
'role': 'user', | |
'content': qna_user_message_template.format( | |
context=context_for_query, | |
question=input | |
) | |
}] | |
prompt = [{'role':'system', 'content': qna_system_message}] | |
for entry in history: | |
prompt += ( | |
[{'role': 'user', 'content': entry[0]}] + | |
[{'role': 'assistant', 'content': entry[1]}] | |
) | |
final_prompt = prompt + user_message | |
try: | |
response = client.chat.completions.create( | |
model=qna_model, | |
messages=final_prompt, | |
temperature=0 | |
) | |
prediction = response.choices[0].message.content.strip() | |
except Exception as e: | |
prediction = "Sorry, I cannot answer your question at this point. Please contact our hotline: 1-800-INSURANCE" | |
return prediction | |
demo = gr.ChatInterface( | |
fn=predict, | |
examples=["Summarize key feaures of my policy", | |
"Did I pay my last premium? How many have I paid so far?", | |
"Are hospitalization charges included in my policy?" | |
], | |
cache_examples=False, | |
theme=gr.themes.Base(), | |
title="Know Your Health Insurance Policy Better", | |
description="Feel free to ask me any query you might have about your health insurance policy", | |
concurrency_limit=8, | |
show_progress="full" | |
) | |
demo.launch(auth=("johndoe", os.getenv('PASSWD'))) |