Spaces:

Manofem
/

Test

Runtime error

Manofem committed on Jan 14, 2024

Commit

2b66b31

verified ·

1 Parent(s): 66d4c12

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,21 +2,20 @@ import time
 import gradio as gr
 from ctransformers import AutoModelForCausalLM
 llm = AutoModelForCausalLM.from_pretrained("TheBloke/WizardLM-7B-uncensored-GGUF", model_file="WizardLM-7B-uncensored.Q3_K_M.gguf", model_type="llama", stream=True)
-history = ["Chatbot:"]
 def generate_response(message):
     global history
-    token_count = 0
     for text in llm(message):
         response = ''.join(text)
         history.append(response)
-        token_count += len(response.split())
-        if token_count >= 2:
-            yield ' '.join(history)
-            token_count = 0
-            # Clear the history list after generating a response
-            history = ["Chatbot:"]
 def chatbot(message, history):
     response_generator = generate_response(message)
@@ -25,4 +24,5 @@ def chatbot(message, history):
         yield response
 iface = gr.ChatInterface(chatbot)
-iface.launch()

 import gradio as gr
 from ctransformers import AutoModelForCausalLM
+# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
 llm = AutoModelForCausalLM.from_pretrained("TheBloke/WizardLM-7B-uncensored-GGUF", model_file="WizardLM-7B-uncensored.Q3_K_M.gguf", model_type="llama", stream=True)
+history = [""]
 def generate_response(message):
     global history
     for text in llm(message):
         response = ''.join(text)
+        time.sleep(2)
         history.append(response)
+        yield ' '.join(history)
+    # Clear the history list after the last response
+    history = ["Chatbot:"]
 def chatbot(message, history):
     response_generator = generate_response(message)
         yield response
 iface = gr.ChatInterface(chatbot)
+iface.launch()
+Can you make the response variable store every 2 words/tokens