Spaces:

Manofem
/

Test

Runtime error

Manofem committed on Jan 13, 2024

Commit

c66f552

verified ·

1 Parent(s): 74753f3

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,11 +5,10 @@ from ctransformers import AutoModelForCausalLM
 # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
 llm = AutoModelForCausalLM.from_pretrained("TheBloke/WizardLM-7B-uncensored-GGUF", model_file="WizardLM-7B-uncensored.Q4_K_M.gguf", model_type="llama", stream=True)
 def generate_response(message):
-    for text in llm(message):
-        yield text
 def chatbot(message, history):

 # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
 llm = AutoModelForCausalLM.from_pretrained("TheBloke/WizardLM-7B-uncensored-GGUF", model_file="WizardLM-7B-uncensored.Q4_K_M.gguf", model_type="llama", stream=True)
 def generate_response(message):
+    tokens = llm(message)
+    response_sentence = ' '.join(tokens)
+    yield response_sentence
 def chatbot(message, history):