Update app.py
Browse files
app.py
CHANGED
@@ -3,8 +3,8 @@ import gradio as gr
|
|
3 |
from ctransformers import AutoModelForCausalLM
|
4 |
|
5 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|
6 |
-
model_path = "WizardLM-7B-uncensored.Q3_K_S.gguf"
|
7 |
-
llm = AutoModelForCausalLM.from_pretrained(model_path, model_type="llama")
|
8 |
|
9 |
def generate_response(message):
|
10 |
response = llm(message)
|
|
|
3 |
from ctransformers import AutoModelForCausalLM
|
4 |
|
5 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|
6 |
+
# Location of the quantized GGUF weights handed to from_pretrained below.
# NOTE(review): this looks like "<hub namespace>/<file name>" rather than a
# local file or a full Hub repo id — confirm it resolves at runtime, or pass
# the repo id and the file name separately (model_file=...).
model_path = "TheBloke/WizardLM-7B-uncensored.Q3_K_S.gguf"
|
7 |
+
# Load the model once at import time so every request reuses the same instance.
# NOTE(review): no gpu_layers argument is passed here even though the comment
# above describes it — presumably the library default applies; confirm.
# NOTE(review): stream=True presumably makes llm(...) yield text chunks instead
# of returning one string — confirm generate_response consumes it accordingly.
llm = AutoModelForCausalLM.from_pretrained(
    model_path,
    model_type="llama",
    stream=True,
)
|
8 |
|
9 |
def generate_response(message):
|
10 |
response = llm(message)
|