desert
committed on
Commit
·
2936c26
1
Parent(s):
346af9c
init inference
Browse files
app.py
CHANGED
|
@@ -1,8 +1,12 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
from llama_cpp import Llama
|
|
|
|
| 3 |
|
| 4 |
-
#
|
| 5 |
-
|
|
|
|
|
|
|
|
|
|
| 6 |
|
| 7 |
# Load the GGUF model using llama-cpp-python
|
| 8 |
print("Loading model...")
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
from llama_cpp import Llama
|
| 3 |
+
from huggingface_hub import hf_hub_download
|
| 4 |
|
| 5 |
+
# Model identifier from Hugging Face
|
| 6 |
+
model_repo = "Mat17892/lora_llama_gguf_g14" # Hugging Face model ID
|
| 7 |
+
|
| 8 |
+
# Download the GGUF file from Hugging Face
|
| 9 |
+
model_path = hf_hub_download(repo_id=model_repo, filename="llama_lora_model.gguf")
|
| 10 |
|
| 11 |
# Load the GGUF model using llama-cpp-python
|
| 12 |
print("Loading model...")
|