WebSearchLLM

Runtime error

App Files Files Community

cnmoro committed on Feb 14

Commit

99b37ed

•

1 Parent(s): 2d3a993

Upload app.py

Browse files

Files changed (1) hide show

app.py +9 -7

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-import time, aiohttp, asyncio, json, os, multiprocessing
 from minivectordb.embedding_model import EmbeddingModel
 from minivectordb.vector_database import VectorDatabase
 from text_util_en_pt.cleaner import structurize_text, detect_language, Language
@@ -6,15 +6,17 @@ from webtextcrawler.webtextcrawler import extract_text_from_url
 from duckduckgo_search import DDGS
 import gradio as gr
 openrouter_key = os.environ.get("OPENROUTER_KEY")
-model = EmbeddingModel(use_quantized_onnx_model=False, e5_model_size='small')
-def fetch_links(query, max_results=10):
     with DDGS() as ddgs:
         return [r['href'] for r in ddgs.text(query, max_results=max_results)]
 def fetch_texts(links):
-    with multiprocessing.Pool() as pool:
         texts = pool.map(extract_text_from_url, links)
     return '\n'.join([t for t in texts if t])
@@ -34,7 +36,7 @@ def index_and_search(query, text):
     # Retrieval
     start = time.time()
-    search_results = vector_db.find_most_similar(query_embedding, k = 10)
     retrieval_time = time.time() - start
     return '\n'.join([s['sentence'] for s in search_results[2]]), embedding_time, retrieval_time
@@ -117,13 +119,13 @@ async def predict(message, history):
 # Setting up the Gradio chat interface.
 gr.ChatInterface(
     predict,
-    title="AI Web Search",
     description="Ask any question, and I will try to answer it using web search !",
     retry_btn=None,
     undo_btn=None,
     examples=[
         'When did the first human land on the moon?',
-        'Liquid vs solid vs gas ?',
         'What is the capital of France?',
         'Why does Brazil has a high tax rate?'
     ]

+import time, aiohttp, asyncio, json, os, multiprocessing, torch
 from minivectordb.embedding_model import EmbeddingModel
 from minivectordb.vector_database import VectorDatabase
 from text_util_en_pt.cleaner import structurize_text, detect_language, Language
 from duckduckgo_search import DDGS
 import gradio as gr
+torch.set_num_threads(2)
 openrouter_key = os.environ.get("OPENROUTER_KEY")
+model = EmbeddingModel(use_quantized_onnx_model=True)
+def fetch_links(query, max_results=5):
     with DDGS() as ddgs:
         return [r['href'] for r in ddgs.text(query, max_results=max_results)]
 def fetch_texts(links):
+    with multiprocessing.Pool(5) as pool:
         texts = pool.map(extract_text_from_url, links)
     return '\n'.join([t for t in texts if t])
     # Retrieval
     start = time.time()
+    search_results = vector_db.find_most_similar(query_embedding, k = 12)
     retrieval_time = time.time() - start
     return '\n'.join([s['sentence'] for s in search_results[2]]), embedding_time, retrieval_time
 # Setting up the Gradio chat interface.
 gr.ChatInterface(
     predict,
+    title="Web Search with LLM !",
     description="Ask any question, and I will try to answer it using web search !",
     retry_btn=None,
     undo_btn=None,
     examples=[
         'When did the first human land on the moon?',
+        'Liquid vs solid vs gas?',
         'What is the capital of France?',
         'Why does Brazil has a high tax rate?'
     ]