Manofem committed on
Commit
4916fa9
·
verified ·
1 Parent(s): 1618b23

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -3,8 +3,8 @@ import gradio as gr
3
  from ctransformers import AutoModelForCausalLM
4
 
5
  # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
6
- model_path = "WizardLM-7B-uncensored.Q3_K_S.gguf"
7
- llm = AutoModelForCausalLM.from_pretrained(model_path, model_type="llama")
8
 
9
  def generate_response(message):
10
  response = llm(message)
 
3
  from ctransformers import AutoModelForCausalLM
4
 
5
  # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
6
+ model_path = "TheBloke/WizardLM-7B-uncensored.Q3_K_S.gguf"
7
+ llm = AutoModelForCausalLM.from_pretrained(model_path, model_type="llama",stream=True)
8
 
9
  def generate_response(message):
10
  response = llm(message)