Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -13,7 +13,7 @@ token_huggingface = os.getenv("HUGGINGFACE_TOKEN")
|
|
| 13 | hf_hub_download(
| 14 | repo_id="bartowski/gemma-2-2b-it-abliterated-GGUF",
| 15 | filename="gemma-2-2b-it-abliterated-Q4_K_M.gguf",
| 16 | - local_dir="./
| 17 | token=token_huggingface
| 18 | )
| 19 |
|
|
@@ -36,7 +36,7 @@ def responder(
|
|
| 36 |
| 37 | if llm is None:
| 38 | llm = Llama(
| 39 | - model_path="
| 40 | flash_attn=True,
| 41 | n_gpu_layers=81,
| 42 | n_batch=1024,
|
|
|
|
| 13 | hf_hub_download(
| 14 | repo_id="bartowski/gemma-2-2b-it-abliterated-GGUF",
| 15 | filename="gemma-2-2b-it-abliterated-Q4_K_M.gguf",
| 16 | + local_dir="./models",
| 17 | token=token_huggingface
| 18 | )
| 19 |
|
|
|
|
| 36 |
| 37 | if llm is None:
| 38 | llm = Llama(
| 39 | + model_path="models/gemma-2-2b-it-abliterated-Q4_K_M.gguf",
| 40 | flash_attn=True,
| 41 | n_gpu_layers=81,
| 42 | n_batch=1024,
|