Spaces:

peterpeter8585
/

syai4.1

Running

peterpeter8585 committed on 10 days ago

Commit

90de6d2

verified ·

1 Parent(s): 3b6cd5e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -94,9 +94,7 @@ llm = ChatLlamaCpp(
     temperature=0,
     model_path="./llama-3-open-ko-8b-instruct-preview-q5_k_m.gguf",
     n_ctx=10000,
-    n_gpu_layers=8,
     n_batch=300,  # Should be between 1 and n_ctx, consider the amount of VRAM in your GPU.
-    max_tokens=512,
     n_threads=multiprocessing.cpu_count() - 1,
     repeat_penalty=1.5,
     top_p=0.5,

     temperature=0,
     model_path="./llama-3-open-ko-8b-instruct-preview-q5_k_m.gguf",
     n_ctx=10000,
     n_batch=300,  # Should be between 1 and n_ctx, consider the amount of VRAM in your GPU.
     n_threads=multiprocessing.cpu_count() - 1,
     repeat_penalty=1.5,
     top_p=0.5,