Spaces:
Sleeping
Sleeping
File size: 4,445 Bytes
48a15e4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 |
import streamlit as st
from langchain.document_loaders import PyPDFLoader
from langchain.vectorstores import FAISS
from langchain.embeddings import HuggingFaceEmbeddings
from langchain.chains import RetrievalQA
from langchain.llms import OpenAI
from langchain.llms import HuggingFaceHub
# from langchain import HuggingFaceHub
if "responses" not in st.session_state:
st.session_state.responses = []
if "questions" not in st.session_state:
st.session_state.questions = []
def app():
st.set_page_config(
page_title="Chat with AI",
page_icon="🤖",
layout="centered"
)
st.title("Chat with AI")
st.markdown(":violet[Get Huggingface API Read Token or Open AI API Key]")
st.markdown("#### Select an Option")
Option = st.selectbox(
label="Select the model",
options=(
"Select the model",
"HuggingFace(Uses Falcon 4b Model)",
"OpenAI"
),
label_visibility="collapsed"
)
if Option != "Select the model":
st.markdown("#### Enter your " + Option + " API key")
API = st.text_input(
"Enter your " + Option + " API key",
label_visibility="collapsed"
)
if API != "":
st.markdown("#### Upload a document")
doc = st.file_uploader("Upload a document", type=["pdf"], label_visibility="collapsed")
if doc is not None:
with open("doc.pdf", "wb") as f:
f.write(doc.getbuffer())
loader = PyPDFLoader("doc.pdf")
pages = loader.load_and_split()
embeddings = HuggingFaceEmbeddings(
model_name="all-MiniLM-L6-v2"
)
faiss_index = FAISS.from_documents(pages, embeddings)
llm = OpenAI(open_api_key=API) if Option == "OpenAI" else (
HuggingFaceHub(
repo_id="tiiuae/falcon-7b-instruct",
model_kwargs={
"temperature": 0.5,
"max_new_tokens": 500
},
huggingfacehub_api_token=API,
)
)
qa = RetrievalQA.from_chain_type(
llm=llm,
chain_type="stuff",
retriever=faiss_index.as_retriever(
search_type="mmr",
search_kwargs={'fetch_k': 10}),
return_source_documents=True
)
container = st.container()
st.write("Ask Your Question Here")
question = st.text_input(
"Ask your question here",
label_visibility="collapsed"
)
with container:
with st.chat_message("assistant"):
st.write("How can I help you?")
if question != "":
response = qa(question)
st.session_state.responses.insert(0, response)
st.session_state.questions.insert(0, question)
for i in range(len(st.session_state.responses)):
with st.chat_message("user"):
st.write(st.session_state.questions[i - 1])
with st.chat_message("assistant"):
with st.expander(
"Response (Click here to collapse)",
expanded=True
):
result = st.session_state.responses[i]
st.write(result['result'])
st.write("Source documents: "
"(Most relevant are first)")
for i in result['source_documents']:
with st.expander(
"Page: " + str(i.metadata['page'])
):
st.write(i.page_content)
st.divider()
if __name__ == "__main__":
app()
|