jedeland committed on
Commit
957293d
·
1 Parent(s): 42390f7

Switch to the Q4_K_M model (unsloth.Q4_K_M.gguf) for faster inference

Browse files
Files changed (1) hide show
  1. app.py +8 -8
app.py CHANGED
@@ -1,17 +1,17 @@
1
  import gradio as gr
2
 
3
- from llama_cpp import Llama, LlamaTokenizer
4
-
5
- # llm = Llama.from_pretrained(
6
- # repo_id="ID2223JR/gguf_model",
7
- # filename="unsloth.Q4_K_M.gguf",
8
- # )
9
 
10
  llm = Llama.from_pretrained(
11
- repo_id="ID2223JR/gguf_model_q8",
12
- filename="unsloth.Q8_0.gguf",
13
  )
14
 
 
 
 
 
 
15
 
16
  # Data storage
17
  ingredients_list = []
 
1
  import gradio as gr
2
 
3
+ from llama_cpp import Llama
 
 
 
 
 
4
 
5
  llm = Llama.from_pretrained(
6
+ repo_id="ID2223JR/gguf_model",
7
+ filename="unsloth.Q4_K_M.gguf",
8
  )
9
 
10
+ # llm = Llama.from_pretrained(
11
+ # repo_id="ID2223JR/gguf_model_q8",
12
+ # filename="unsloth.Q8_0.gguf",
13
+ # )
14
+
15
 
16
  # Data storage
17
  ingredients_list = []