moriire committed on
Commit
608c192
·
verified ·
1 Parent(s): 1c75184

Update app/llm.py

Browse files
Files changed (1) hide show
  1. app/llm.py +3 -3
app/llm.py CHANGED
@@ -30,9 +30,9 @@ class ChatModel(BaseModel):
30
  mirostat_tau: float=4.0
31
  mirostat_eta: float=1.1
32
  llm_chat = llama_cpp.Llama.from_pretrained(
33
- repo_id="moriire/healthcare-ai-q8_0",
34
- filename="healthcare-ai-q8_0-unsloth.Q8_0.gguf",
35
- tokenizer=llama_cpp.llama_tokenizer.LlamaHFTokenizer.from_pretrained("moriire/healthcare-ai-q8_0"),
36
  verbose=False,
37
  n_ctx=256,
38
  n_gpu_layers=0,
 
30
  mirostat_tau: float=4.0
31
  mirostat_eta: float=1.1
32
  llm_chat = llama_cpp.Llama.from_pretrained(
33
+ repo_id="moriire/healthcare-ai-q4_k_m",
34
+ filename="*.gguf",
35
+ tokenizer=llama_cpp.llama_tokenizer.LlamaHFTokenizer.from_pretrained("moriire/healthcare-ai-q4_k_m"),
36
  verbose=False,
37
  n_ctx=256,
38
  n_gpu_layers=0,