reduce model size
app.py CHANGED
@@ -34,7 +34,7 @@ print("loading the LLM......................................")
 # )
 
 llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
-                                           model_file="llama-2-7b-chat.
+                                           model_file="llama-2-7b-chat.Q3_K_S.gguf",
                                            model_type="llama",
                                            temperature = 0.2,
                                            repetition_penalty = 1.5
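The commit keeps the loading call intact and only swaps the GGUF weights file for the Q3_K_S quantization, the smallest 3-bit variant of this checkpoint, which is what actually reduces the download and memory footprint. Below is a minimal sketch of the resulting loading code, assuming the AutoModelForCausalLM here comes from the ctransformers library (its from_pretrained accepts model_file/model_type and generation settings as keyword arguments); the import and the demo prompt are illustrative and not part of the original app.py.

# Minimal sketch, assuming ctransformers provides this AutoModelForCausalLM.
from ctransformers import AutoModelForCausalLM

print("loading the LLM......................................")

# Q3_K_S is a smaller quantization of the same Llama-2-7B-Chat checkpoint,
# so it loads with a lower RAM footprint than higher-bit GGUF variants.
llm = AutoModelForCausalLM.from_pretrained(
    "TheBloke/Llama-2-7B-Chat-GGUF",
    model_file="llama-2-7b-chat.Q3_K_S.gguf",
    model_type="llama",
    temperature=0.2,
    repetition_penalty=1.5,
)

# Illustrative usage only: the model object is callable and returns generated text.
print(llm("Explain in one sentence what a GGUF quantization level is."))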