Spaces:

hsuwill000
/

test0001

Runtime error

hsuwill000 committed on Feb 26

Commit

0d3a8e6

verified ·

1 Parent(s): a9e6e4a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -39,9 +39,9 @@ def setup_model(model_id):
     gguf_path = f"{local_dir}.gguf"
     if not os.path.exists(gguf_path):
         run_command(f'python llama.cpp/convert_hf_to_gguf.py ./{local_dir} --outfile {gguf_path}')
-    quantized_path = f"{local_dir}-Q2_K.gguf"
     if not os.path.exists(quantized_path):
-        run_command(f'./llama.cpp/build/bin/llama-quantize ./{gguf_path} {quantized_path} Q2_K')
     return quantized_path
 def chat_with_model(message, history, system_prompt, temperature, max_tokens, top_k, top_p):

     gguf_path = f"{local_dir}.gguf"
     if not os.path.exists(gguf_path):
         run_command(f'python llama.cpp/convert_hf_to_gguf.py ./{local_dir} --outfile {gguf_path}')
+    quantized_path = f"{local_dir}-IQ2_XXS.gguf"
     if not os.path.exists(quantized_path):
+        run_command(f'./llama.cpp/build/bin/llama-quantize ./{gguf_path} {quantized_path} IQ2_XXS')
     return quantized_path
 def chat_with_model(message, history, system_prompt, temperature, max_tokens, top_k, top_p):