Spaces:

sambanovasystems
/

enterprise_knowledge_retriever

Runtime error

App Files Community

petrojm committed on Sep 25

Commit

3b758aa

•

1 Parent(s): e443083

changes to app

Browse files

Files changed (1) hide show

app.py +13 -12

app.py CHANGED Viewed

@@ -7,17 +7,17 @@ current_dir = os.path.dirname(os.path.abspath(__file__))
 from src.document_retrieval import DocumentRetrieval
 from utils.visual.env_utils import env_input_fields, initialize_env_variables, are_credentials_set, save_credentials
-from utils.parsing.sambaparse import parse_doc_universal # added Petro
 from utils.vectordb.vector_db import VectorDb
 CONFIG_PATH = os.path.join(current_dir,'config.yaml')
 PERSIST_DIRECTORY = os.path.join(current_dir,f"data/my-vector-db") # changed to current_dir
-def handle_userinput(user_question, conversation, history):
     if user_question:
         try:
             # Generate response
-            response = conversation.invoke({"question": user_question})
             # Append user message and response to chat history
             history = history + [(user_question, response["answer"])]
@@ -28,27 +28,27 @@ def handle_userinput(user_question, conversation, history):
     else:
         return history, ""
-def process_documents(files, document_retrieval, vectorstore, conversation, save_location=None):
     try:
         document_retrieval = DocumentRetrieval()
         _, _, text_chunks = parse_doc_universal(doc=files)
         print(text_chunks)
         embeddings = document_retrieval.load_embedding_model()
-        collection_name = 'ekr_default_collection' if not config['prod_mode'] else None
         vectorstore = document_retrieval.create_vector_store(text_chunks, embeddings, output_db=save_location, collection_name=collection_name)
         document_retrieval.init_retriever(vectorstore)
-        conversation = document_retrieval.get_qa_retrieval_chain()
         #input_disabled = False
-        return conversation, vectorstore, document_retrieval, "Complete! You can now ask questions."
     except Exception as e:
-        return conversation, vectorstore, document_retrieval, f"An error occurred while processing: {str(e)}"
 # Read config file
 with open(CONFIG_PATH, 'r') as yaml_file:
     config = yaml.safe_load(yaml_file)
 prod_mode = config.get('prod_mode', False)
-default_collection = 'ekr_default_collection'
 # Load env variables
 initialize_env_variables(prod_mode)
@@ -58,8 +58,9 @@ caution_text = """⚠️ Note: depending on the size of your document, this coul
 with gr.Blocks() as demo:
     vectorstore = gr.State()
-    conversation = gr.State()
     document_retrieval = gr.State()
     gr.Markdown("# Enterprise Knowledge Retriever",
             elem_id="title")
@@ -80,7 +81,7 @@ with gr.Blocks() as demo:
     gr.Markdown(caution_text)
     # Preprocessing events
-    process_btn.click(process_documents, inputs=[docs, document_retrieval, vectorstore, conversation], outputs=[conversation, vectorstore, document_retrieval, setup_output], concurrency_limit=10)
     # Step 3: Chat with your data
     gr.Markdown("## 3️⃣ Chat with your document")
@@ -90,7 +91,7 @@ with gr.Blocks() as demo:
     sources_output = gr.Textbox(label="Sources", visible=False)
     # Chatbot events
-    msg.submit(handle_userinput, inputs=[msg, conversation, chatbot], outputs=[chatbot, msg], queue=False)
     clear_btn.click(lambda: [None, ""], inputs=None, outputs=[chatbot, msg], queue=False)
 if __name__ == "__main__":

 from src.document_retrieval import DocumentRetrieval
 from utils.visual.env_utils import env_input_fields, initialize_env_variables, are_credentials_set, save_credentials
+from utils.parsing.sambaparse import parse_doc_universal # added
 from utils.vectordb.vector_db import VectorDb
 CONFIG_PATH = os.path.join(current_dir,'config.yaml')
 PERSIST_DIRECTORY = os.path.join(current_dir,f"data/my-vector-db") # changed to current_dir
+def handle_userinput(user_question, conversation_chain, history):
     if user_question:
         try:
             # Generate response
+            response = conversation_chain.invoke({"question": user_question})
             # Append user message and response to chat history
             history = history + [(user_question, response["answer"])]
     else:
         return history, ""
+def process_documents(files, collection_name, document_retrieval, vectorstore, conversation_chain, save_location=None):
     try:
         document_retrieval = DocumentRetrieval()
         _, _, text_chunks = parse_doc_universal(doc=files)
         print(text_chunks)
         embeddings = document_retrieval.load_embedding_model()
+        collection_name = 'ekr_default_collection'
         vectorstore = document_retrieval.create_vector_store(text_chunks, embeddings, output_db=save_location, collection_name=collection_name)
         document_retrieval.init_retriever(vectorstore)
+        conversation_chain = document_retrieval.get_qa_retrieval_chain()
         #input_disabled = False
+        return conversation_chain, vectorstore, document_retrieval, collection_name, "Complete! You can now ask questions."
     except Exception as e:
+        return conversation_chain, vectorstore, document_retrieval, collection_name, f"An error occurred while processing: {str(e)}"
 # Read config file
 with open(CONFIG_PATH, 'r') as yaml_file:
     config = yaml.safe_load(yaml_file)
 prod_mode = config.get('prod_mode', False)
+#default_collection = 'ekr_default_collection'
 # Load env variables
 initialize_env_variables(prod_mode)
 with gr.Blocks() as demo:
     vectorstore = gr.State()
+    conversation_chain = gr.State()
     document_retrieval = gr.State()
+    collection_name=gr.State()
     gr.Markdown("# Enterprise Knowledge Retriever",
             elem_id="title")
     gr.Markdown(caution_text)
     # Preprocessing events
+    process_btn.click(process_documents, inputs=[docs, collection_name, document_retrieval, vectorstore, conversation_chain], outputs=[conversation_chain, vectorstore, document_retrieval, collection_name, setup_output], concurrency_limit=10)
     # Step 3: Chat with your data
     gr.Markdown("## 3️⃣ Chat with your document")
     sources_output = gr.Textbox(label="Sources", visible=False)
     # Chatbot events
+    msg.submit(handle_userinput, inputs=[msg, conversation_chain, chatbot], outputs=[chatbot, msg], queue=False)
     clear_btn.click(lambda: [None, ""], inputs=None, outputs=[chatbot, msg], queue=False)
 if __name__ == "__main__":