Spaces:

rwayz
/

ModelsChatBot

Running

App Files Community

rwayz committed on Mar 21

Commit

a8b1809

verified ·

1 Parent(s): 26425fc

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -9

app.py CHANGED Viewed

@@ -2,29 +2,35 @@ import gradio as gr
 from huggingface_hub import InferenceClient
 import os
 import time
 HF_TOKEN = os.getenv("HF_TOKEN")
 client = InferenceClient(
     provider="sambanova",
     api_key=HF_TOKEN,
 )
 MODELS = {
     "LLaMA 70B": "meta-llama/Llama-3.3-70B-Instruct",
     "Qwen 32B": "Qwen/QwQ-32B",
-    "DeepSeek R1":"deepseek-ai/DeepSeek-R1",
 }
 history_log = []
 show_history_flag = False
 def chatbot_response(user_input, model_name):
     model_id = MODELS[model_name]
     messages = [{"role": "user", "content": entry["Pergunta"]} for entry in history_log[-2:]]
     messages.append({"role": "user", "content": user_input})
     start_time = time.time()
     try:
         completion = client.chat.completions.create(
@@ -36,26 +42,26 @@ def chatbot_response(user_input, model_name):
     except Exception as e:
         response = f"Erro ao gerar resposta: {str(e)}"
     end_time = time.time()
     history_log.append({
         "Modelo": model_name,
         "Pergunta": user_input,
         "Resposta": response,
         "Tempo de Resposta (s)": round(end_time - start_time, 2)
     })
     return response
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     with gr.Row():
         with gr.Column(scale=1):
             gr.Markdown("## ⚙️ Configurações")
-            model_selector = gr.Radio(
                 choices=list(MODELS.keys()),
                 label="Escolha o Modelo",
                 value="LLaMA 70B"
             )
         with gr.Column(scale=4):
             gr.Markdown("# 🤖 Chatbot - API SambaNova")
             chatbot = gr.Chatbot(height=500)
@@ -63,16 +69,16 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             with gr.Row():
                 btn = gr.Button("Enviar", variant="primary")
                 history_btn = gr.Button("Histórico", variant="secondary")
             history_output = gr.JSON()
     def respond(message, chat_history, model_name):
         response = chatbot_response(message, model_name)
         chat_history.append((message, response))
         return "", chat_history
     btn.click(respond, [msg, chatbot, model_selector], [msg, chatbot])
-    msg.submit(respond, [msg, chatbot, model_selector], [msg, chatbot])
     def toggle_history():
         global show_history_flag
@@ -81,5 +87,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     history_btn.click(toggle_history, inputs=[], outputs=history_output)
 if __name__ == "__main__":
     demo.launch()

 from huggingface_hub import InferenceClient
 import os
 import time
+import re  # para limpar tags como <think>
+# Token de autenticação
 HF_TOKEN = os.getenv("HF_TOKEN")
+# Cliente da API da HuggingFace/SambaNova
 client = InferenceClient(
     provider="sambanova",
     api_key=HF_TOKEN,
 )
+# Modelos disponíveis
 MODELS = {
     "LLaMA 70B": "meta-llama/Llama-3.3-70B-Instruct",
     "Qwen 32B": "Qwen/QwQ-32B",
+    "DeepSeek R1": "deepseek-ai/DeepSeek-R1",
 }
 history_log = []
 show_history_flag = False
+def clean_response(text):
+    return re.sub(r"</?think>", "", text).strip()
 def chatbot_response(user_input, model_name):
     model_id = MODELS[model_name]
     messages = [{"role": "user", "content": entry["Pergunta"]} for entry in history_log[-2:]]
     messages.append({"role": "user", "content": user_input})
     start_time = time.time()
     try:
         completion = client.chat.completions.create(
     except Exception as e:
         response = f"Erro ao gerar resposta: {str(e)}"
     end_time = time.time()
     history_log.append({
         "Modelo": model_name,
         "Pergunta": user_input,
         "Resposta": response,
         "Tempo de Resposta (s)": round(end_time - start_time, 2)
     })
     return response
+# Interface Gradio
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     with gr.Row():
         with gr.Column(scale=1):
             gr.Markdown("## ⚙️ Configurações")
+            model_selector = gr.Dropdown(
                 choices=list(MODELS.keys()),
                 label="Escolha o Modelo",
                 value="LLaMA 70B"
             )
         with gr.Column(scale=4):
             gr.Markdown("# 🤖 Chatbot - API SambaNova")
             chatbot = gr.Chatbot(height=500)
             with gr.Row():
                 btn = gr.Button("Enviar", variant="primary")
                 history_btn = gr.Button("Histórico", variant="secondary")
             history_output = gr.JSON()
     def respond(message, chat_history, model_name):
         response = chatbot_response(message, model_name)
+        response = clean_response(response)
         chat_history.append((message, response))
         return "", chat_history
     btn.click(respond, [msg, chatbot, model_selector], [msg, chatbot])
+    msg.submit(respond, [msg, chatbot, model_selector], [msg, chatbot])
     def toggle_history():
         global show_history_flag
     history_btn.click(toggle_history, inputs=[], outputs=history_output)
+# Executa o app
 if __name__ == "__main__":
     demo.launch()