Spaces:
Sleeping
Sleeping
vidhiparikh
committed on
Commit
•
1bc21a7
1
Parent(s):
436241a
Update app.py
Browse files
app.py
CHANGED
@@ -75,8 +75,8 @@ callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])
|
|
75 |
# Function to create a conversational chain
|
76 |
def create_conversational_chain(database):
|
77 |
llama_llm = LlamaCpp(
|
78 |
-
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|
79 |
-
llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7b-Chat-GGUF", model_file="llama-2-7b-chat.
|
80 |
temperature=0.75,
|
81 |
max_tokens=200,
|
82 |
top_p=1,
|
|
|
75 |
# Function to create a conversational chain
|
76 |
def create_conversational_chain(database):
|
77 |
llama_llm = LlamaCpp(
|
78 |
+
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system. llama-2-7b-chat.Q8_0.gguf
|
79 |
+
llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7b-Chat-GGUF", model_file="llama-2-7b-chat.Q8_0.gguf", model_type="llama", gpu_layers=0),
|
80 |
temperature=0.75,
|
81 |
max_tokens=200,
|
82 |
top_p=1,
|