desert
committed on
Commit
•
2936c26
1
Parent(s):
346af9c
init inference
Browse files
app.py
CHANGED
@@ -1,8 +1,12 @@
|
|
1 |
import gradio as gr
|
2 |
from llama_cpp import Llama
|
|
|
3 |
|
4 |
-
#
|
5 |
-
|
|
|
|
|
|
|
6 |
|
7 |
# Load the GGUF model using llama-cpp-python
|
8 |
print("Loading model...")
|
|
|
1 |
import gradio as gr
|
2 |
from llama_cpp import Llama
|
3 |
+
from huggingface_hub import hf_hub_download
|
4 |
|
5 |
+
# Model identifier from Hugging Face
|
6 |
+
model_repo = "Mat17892/lora_llama_gguf_g14" # Hugging Face model ID
|
7 |
+
|
8 |
+
# Download the GGUF file from Hugging Face
|
9 |
+
model_path = hf_hub_download(repo_id=model_repo, filename="llama_lora_model.gguf")
|
10 |
|
11 |
# Load the GGUF model using llama-cpp-python
|
12 |
print("Loading model...")
|