ChatInterface

Sleeping

App Files Files Community

ChatInterface / app.py

ProximileAdmin

Update app.py

0ac657c verified 3 months ago

raw

history blame contribute delete

5.76 kB

	import os
	import gradio as gr
	from openai import OpenAI
	from typing import List, Tuple

	CLIENTS = {
	"perplexity": {"key": os.getenv('PX_KEY'), "endpoint": "https://api.perplexity.ai"},
	"hyperbolic": {"key": os.getenv('HYPERBOLIC_XYZ_KEY'), "endpoint": "https://api.hyperbolic.xyz/v1"},
	"huggingface": {"key": os.getenv('HF_KEY'), "endpoint": "https://huggingface.co/api/inference-proxy/together"},
	}
	for client_type in CLIENTS:
	CLIENTS[client_type]["client"] = OpenAI(
	base_url=CLIENTS[client_type]["endpoint"],
	api_key=CLIENTS[client_type]["key"]
	)

	PASSWORD = os.getenv("PASSWD")

	# Define available models
	AVAILABLE_MODELS = {
	"Llama3.3-70b-Instruct (Hyperbolic.xyz)": {
	"model_name": "meta-llama/Llama-3.3-70B-Instruct",
	"type": "hyperbolic"
	},
	"Llama3.1-8b-Instruct (Hyperbolic.xyz)": {
	"model_name": "meta-llama/Meta-Llama-3.1-8B-Instruct",
	"type": "hyperbolic"
	},
	"DeepSeek V3 (Hyperbolic.xyz)": {
	"model_name": "deepseek-ai/DeepSeek-V3",
	"type": "hyperbolic"
	},
	"DeepSeek V3 (HuggingFace.co)": {
	"model_name": "deepseek-ai/DeepSeek-V3",
	"type": "huggingface"
	},
	"Sonar Pro (Perplexity.ai)": {
	"model_name": "sonar-pro",
	"type": "perplexity"
	},
	"Sonar (Perplexity.ai)": {
	"model_name": "sonar",
	"type": "perplexity"
	},
	}

	def respond(
	message: str,
	history: List[Tuple[str, str]],
	session_password: str, # added parameter from session state
	system_message: str,
	model_choice: str,
	max_tokens: int,
	temperature: float,
	top_p: float,
	):
	"""Handles chatbot responses with password re-checking."""
	# Re-check the session password on every message
	if session_password != PASSWORD:
	yield "Error: Invalid session password. Please refresh the page and enter the correct password."
	return

	if model_choice not in AVAILABLE_MODELS:
	yield "Error: Invalid model selection."
	return

	messages = [{"role": "system", "content": system_message}]
	for user_msg, assistant_msg in history:
	if user_msg:
	messages.append({"role": "user", "content": user_msg})
	if assistant_msg:
	messages.append({"role": "assistant", "content": assistant_msg})
	messages.append({"role": "user", "content": message})

	response = ""
	citations = []

	selected_client = CLIENTS[AVAILABLE_MODELS[model_choice]["type"]]["client"]

	try:
	stream = selected_client.chat.completions.create(
	model=AVAILABLE_MODELS[model_choice]["model_name"],
	messages=messages,
	max_tokens=max_tokens,
	temperature=temperature,
	top_p=top_p,
	stream=True,
	)

	for chunk in stream:
	if hasattr(chunk, "choices") and chunk.choices:
	token = chunk.choices[0].delta.content or ""
	response += token
	yield response # Stream response as it arrives
	if hasattr(chunk, "citations") and chunk.citations:
	citations = chunk.citations

	# Append citations as clickable links, if any
	if citations:
	citation_text = "\n\nSources:\n" + "\n".join(
	[f"[{i+1}] [{url}]({url})" for i, url in enumerate(citations)]
	)
	response += citation_text
	yield response

	except Exception as e:
	yield f"Error: {str(e)}"


	def check_password(input_password):
	"""Validates the password and, if valid, stores it in session state."""
	if input_password == PASSWORD:
	# Return the password to store in the session state.
	return gr.update(visible=False), gr.update(visible=True), input_password
	else:
	return gr.update(value="", interactive=True), gr.update(visible=False), ""

	with gr.Blocks() as demo:
	# A hidden state component to store the session password
	session_password = gr.State("")

	with gr.Column():
	password_input = gr.Textbox(
	type="password", label="Enter Password", interactive=True
	)
	submit_button = gr.Button("Submit")
	error_message = gr.Textbox(
	label="Error", visible=False, interactive=False
	)

	with gr.Column(visible=False) as chat_interface:
	system_prompt = gr.Textbox(
	value="You are a helpful assistant.", label="System message"
	)
	model_choice = gr.Dropdown(
	choices=list(AVAILABLE_MODELS.keys()),
	value=list(AVAILABLE_MODELS.keys())[0],
	label="Select Model"
	)
	max_tokens = gr.Slider(
	minimum=1, maximum=30000, value=2048, step=100, label="Max new tokens"
	)
	temperature = gr.Slider(
	minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"
	)
	top_p = gr.Slider(
	minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"
	)

	# Note: The session_password is now passed as an additional input to the chat function.
	chat = gr.ChatInterface(
	fn=respond,
	api_name=False,
	chatbot=gr.Chatbot(height=400), # Set desired height here
	additional_inputs=[session_password, system_prompt, model_choice, max_tokens, temperature, top_p]
	)

	# Now, the submit_button click updates three outputs: the password_input, chat_interface visibility, and session_password state.
	submit_button.click(
	fn=check_password,
	inputs=password_input,
	outputs=[password_input, chat_interface, session_password]
	)

	if __name__ == "__main__":
	demo.launch()