Spaces:
Running
Running
add LLama2-70b
Browse files- streamlit_app.py +20 -7
streamlit_app.py
CHANGED
@@ -57,6 +57,11 @@ def init_qa(model):
|
|
57 |
model_kwargs={"temperature": 0.01, "max_length": 4096, "max_new_tokens": 2048})
|
58 |
embeddings = HuggingFaceEmbeddings(
|
59 |
model_name="all-MiniLM-L6-v2")
|
|
|
|
|
|
|
|
|
|
|
60 |
|
61 |
return DocumentQAEngine(chat, embeddings, grobid_url=os.environ['GROBID_URL'])
|
62 |
|
@@ -82,26 +87,31 @@ def play_old_messages():
|
|
82 |
else:
|
83 |
st.write(message['content'])
|
84 |
|
|
|
85 |
is_api_key_provided = st.session_state['api_key']
|
86 |
|
87 |
-
model = st.sidebar.radio("Model (cannot be changed after selection or upload)",
|
|
|
88 |
index=1,
|
89 |
captions=[
|
90 |
"ChatGPT 3.5 Turbo + Ada-002-text (embeddings)",
|
91 |
-
"Mistral-7B-Instruct-V0.1 + Sentence BERT (embeddings)"
|
|
|
92 |
],
|
93 |
help="Select the model you want to use.",
|
94 |
disabled=is_api_key_provided)
|
95 |
|
96 |
if not st.session_state['api_key']:
|
97 |
-
if model == 'mistral-7b-instruct-v0.1':
|
98 |
-
api_key = st.sidebar.text_input('Huggingface API Key') if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ else
|
|
|
99 |
if api_key:
|
100 |
st.session_state['api_key'] = is_api_key_provided = True
|
101 |
os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_key
|
102 |
st.session_state['rqa'] = init_qa(model)
|
103 |
elif model == 'chatgpt-3.5-turbo':
|
104 |
-
api_key = st.sidebar.text_input('OpenAI API Key') if 'OPENAI_API_KEY' not in os.environ else os.environ[
|
|
|
105 |
if api_key:
|
106 |
st.session_state['api_key'] = is_api_key_provided = True
|
107 |
os.environ['OPENAI_API_KEY'] = api_key
|
@@ -137,7 +147,8 @@ question = st.chat_input(
|
|
137 |
with st.sidebar:
|
138 |
st.header("Documentation")
|
139 |
st.markdown("https://github.com/lfoppiano/document-qa")
|
140 |
-
st.markdown(
|
|
|
141 |
|
142 |
st.markdown(
|
143 |
"""After uploading, please wait for the PDF to be processed. You will see a spinner or loading indicator while the processing is in progress. Once the spinner stops, you can proceed to ask your questions.""")
|
@@ -158,7 +169,9 @@ if uploaded_file and not st.session_state.loaded_embeddings:
|
|
158 |
tmp_file = NamedTemporaryFile()
|
159 |
tmp_file.write(bytearray(binary))
|
160 |
# hash = get_file_hash(tmp_file.name)[:10]
|
161 |
-
st.session_state['doc_id'] = hash = st.session_state['rqa'].create_memory_embeddings(tmp_file.name,
|
|
|
|
|
162 |
st.session_state['loaded_embeddings'] = True
|
163 |
|
164 |
# timestamp = datetime.utcnow()
|
|
|
57 |
model_kwargs={"temperature": 0.01, "max_length": 4096, "max_new_tokens": 2048})
|
58 |
embeddings = HuggingFaceEmbeddings(
|
59 |
model_name="all-MiniLM-L6-v2")
|
60 |
+
elif model == 'llama-2-70b-chat':
|
61 |
+
chat = HuggingFaceHub(repo_id="meta-llama/Llama-2-70b-chat-hf",
|
62 |
+
model_kwargs={"temperature": 0.01, "max_length": 4096, "max_new_tokens": 2048})
|
63 |
+
embeddings = HuggingFaceEmbeddings(
|
64 |
+
model_name="all-MiniLM-L6-v2")
|
65 |
|
66 |
return DocumentQAEngine(chat, embeddings, grobid_url=os.environ['GROBID_URL'])
|
67 |
|
|
|
87 |
else:
|
88 |
st.write(message['content'])
|
89 |
|
90 |
+
|
91 |
is_api_key_provided = st.session_state['api_key']
|
92 |
|
93 |
+
model = st.sidebar.radio("Model (cannot be changed after selection or upload)",
|
94 |
+
("chatgpt-3.5-turbo", "mistral-7b-instruct-v0.1", "llama-2-70b-chat"),
|
95 |
index=1,
|
96 |
captions=[
|
97 |
"ChatGPT 3.5 Turbo + Ada-002-text (embeddings)",
|
98 |
+
"Mistral-7B-Instruct-V0.1 + Sentence BERT (embeddings)",
|
99 |
+
"LLama2-70B-Chat + Sentence BERT (embeddings)",
|
100 |
],
|
101 |
help="Select the model you want to use.",
|
102 |
disabled=is_api_key_provided)
|
103 |
|
104 |
if not st.session_state['api_key']:
|
105 |
+
if model == 'mistral-7b-instruct-v0.1' or 'llama-2-70b-chat':
|
106 |
+
api_key = st.sidebar.text_input('Huggingface API Key') if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ else \
|
107 |
+
os.environ['HUGGINGFACEHUB_API_TOKEN']
|
108 |
if api_key:
|
109 |
st.session_state['api_key'] = is_api_key_provided = True
|
110 |
os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_key
|
111 |
st.session_state['rqa'] = init_qa(model)
|
112 |
elif model == 'chatgpt-3.5-turbo':
|
113 |
+
api_key = st.sidebar.text_input('OpenAI API Key') if 'OPENAI_API_KEY' not in os.environ else os.environ[
|
114 |
+
'OPENAI_API_KEY']
|
115 |
if api_key:
|
116 |
st.session_state['api_key'] = is_api_key_provided = True
|
117 |
os.environ['OPENAI_API_KEY'] = api_key
|
|
|
147 |
with st.sidebar:
|
148 |
st.header("Documentation")
|
149 |
st.markdown("https://github.com/lfoppiano/document-qa")
|
150 |
+
st.markdown(
|
151 |
+
"""After entering your API Key (Open AI or Huggingface). Upload a scientific article as PDF document, click on the designated button and select the file from your device.""")
|
152 |
|
153 |
st.markdown(
|
154 |
"""After uploading, please wait for the PDF to be processed. You will see a spinner or loading indicator while the processing is in progress. Once the spinner stops, you can proceed to ask your questions.""")
|
|
|
169 |
tmp_file = NamedTemporaryFile()
|
170 |
tmp_file.write(bytearray(binary))
|
171 |
# hash = get_file_hash(tmp_file.name)[:10]
|
172 |
+
st.session_state['doc_id'] = hash = st.session_state['rqa'].create_memory_embeddings(tmp_file.name,
|
173 |
+
chunk_size=250,
|
174 |
+
perc_overlap=0.1)
|
175 |
st.session_state['loaded_embeddings'] = True
|
176 |
|
177 |
# timestamp = datetime.utcnow()
|