Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -13,7 +13,7 @@ token_huggingface = os.getenv("HUGGINGFACE_TOKEN")
|
|
13 |
hf_hub_download(
|
14 |
repo_id="bartowski/gemma-2-2b-it-abliterated-GGUF",
|
15 |
filename="gemma-2-2b-it-abliterated-Q4_K_M.gguf",
|
16 |
-
local_dir="./
|
17 |
token=token_huggingface
|
18 |
)
|
19 |
|
@@ -36,7 +36,7 @@ def responder(
|
|
36 |
|
37 |
if llm is None:
|
38 |
llm = Llama(
|
39 |
-
model_path="
|
40 |
flash_attn=True,
|
41 |
n_gpu_layers=81,
|
42 |
n_batch=1024,
|
|
|
13 |
hf_hub_download(
|
14 |
repo_id="bartowski/gemma-2-2b-it-abliterated-GGUF",
|
15 |
filename="gemma-2-2b-it-abliterated-Q4_K_M.gguf",
|
16 |
+
local_dir="./models",
|
17 |
token=token_huggingface
|
18 |
)
|
19 |
|
|
|
36 |
|
37 |
if llm is None:
|
38 |
llm = Llama(
|
39 |
+
model_path="models/gemma-2-2b-it-abliterated-Q4_K_M.gguf",
|
40 |
flash_attn=True,
|
41 |
n_gpu_layers=81,
|
42 |
n_batch=1024,
|