Spaces:

dkdaniz
/

katara

Paused

Daniel Marques committed on Oct 15, 2023

Commit

2453cc0

1 Parent(s): 08f602b

fix: add types

Files changed (2) hide show

load_models.py CHANGED Viewed

@@ -14,7 +14,6 @@ from transformers import (
     LlamaTokenizer,
     GenerationConfig,
     pipeline,
-    TextStreamer
 )

     LlamaTokenizer,
     GenerationConfig,
     pipeline,
 )

main.py CHANGED Viewed

@@ -31,7 +31,6 @@ class Predict(BaseModel):
 class Delete(BaseModel):
     filename: str
 class MyCustomAsyncHandler(AsyncCallbackHandler):
     def on_llm_new_token(self, token: str, **kwargs) -> None:
         print(f" token: {token}")
@@ -66,7 +65,7 @@ DB = Chroma(
 RETRIEVER = DB.as_retriever()
-LLM = load_model(device_type=DEVICE_TYPE, model_id=MODEL_ID, model_basename=MODEL_BASENAME, stream=True, callbacks = [MyCustomAsyncHandler])
 template = """you are a helpful, respectful and honest assistant. When answering questions, you should only use the documents provided.
 You should only answer the topics that appear in these documents.

 class Delete(BaseModel):
     filename: str
 class MyCustomAsyncHandler(AsyncCallbackHandler):
     def on_llm_new_token(self, token: str, **kwargs) -> None:
         print(f" token: {token}")
 RETRIEVER = DB.as_retriever()
+LLM = load_model(device_type=DEVICE_TYPE, model_id=MODEL_ID, model_basename=MODEL_BASENAME, stream=True, callbacks=[MyCustomAsyncHandler()])
 template = """you are a helpful, respectful and honest assistant. When answering questions, you should only use the documents provided.
 You should only answer the topics that appear in these documents.