Spaces:

ignitariumcloud
/

Voice_Controlled_Shop_Assistant_System

Sleeping

App Files Files Community

Voice_Controlled_Shop_Assistant_System / app.py

arjunanand13

Update app.py

6219b13 verified 7 days ago

raw

history blame

5.5 kB

	import os
	import sqlite3
	import requests
	import openai
	import gradio as gr
	import asyncio
	from gtts import gTTS
	from typing_extensions import TypedDict
	from langgraph.graph import StateGraph, START, END
	import csv

	# Load API keys: the OpenAI key is read from the OPENAI_API_KEY environment
	# variable. os.getenv returns None when the variable is unset.
	openai.api_key = os.getenv("OPENAI_API_KEY")

	# --- Initialize Database from external CSV ---
	def init_db_from_csv(csv_path: str = "transactions.csv") -> None:
	    """Create the 'transactions' table in shop.db and reload it from a CSV file.

	    The CSV needs a header row with 'date', 'product' and 'amount' columns.
	    Rows already in the table are replaced by the CSV contents.

	    Args:
	        csv_path: Path of the CSV file to load.

	    Raises:
	        OSError: If the CSV file cannot be opened.
	        KeyError: If a required column is missing.
	        ValueError: If an 'amount' value cannot be converted to float.
	        sqlite3.Error: If the database cannot be written.
	    """
	    conn = sqlite3.connect("shop.db")
	    try:
	        conn.execute(
	            "CREATE TABLE IF NOT EXISTS transactions (date TEXT, product TEXT, amount REAL)"
	        )
	        # utf-8-sig also accepts a leading UTF-8 byte-order mark, which would
	        # otherwise become part of the first header name ('date').
	        with open(csv_path, newline="", encoding="utf-8-sig") as f:
	            rows = [
	                (row["date"], row["product"], float(row["amount"]))
	                for row in csv.DictReader(f)
	            ]
	        # Replace old data atomically: the connection context manager commits
	        # on success and rolls back if the delete or insert fails.
	        with conn:
	            conn.execute("DELETE FROM transactions")
	            conn.executemany(
	                "INSERT INTO transactions (date, product, amount) VALUES (?, ?, ?)",
	                rows,
	            )
	    finally:
	        # Always release the connection, including when the CSV is missing
	        # or malformed.
	        conn.close()

	# Initialize DB at startup. This call runs at import time and loads
	# "transactions.csv" (the function's default path) relative to the working
	# directory. init_db_from_csv opens that file without catching errors, so a
	# missing file raises here.
	init_db_from_csv()

	# --- Business Logic Functions ---

	def db_agent(query: str) -> str:
	    """Report today's highest-revenue product from shop.db.

	    Args:
	        query: The user's question. It is not used to build the SQL; the same
	            fixed "top product today" query runs on every call.

	    Returns:
	        A sentence naming the product with the largest summed amount for
	        today, a "no transactions" message when nothing matches, or a
	        database-error message when SQLite raises OperationalError (for
	        example when the table does not exist).
	    """
	    try:
	        conn = sqlite3.connect("shop.db")
	        try:
	            # NOTE(review): SQLite evaluates date('now') in UTC - confirm the
	            # dates stored in the table follow the same convention.
	            row = conn.execute(
	                """
	                SELECT product, SUM(amount) AS revenue
	                FROM transactions
	                WHERE date = date('now')
	                GROUP BY product
	                ORDER BY revenue DESC
	                LIMIT 1
	                """
	            ).fetchone()
	        finally:
	            # Close on every path so repeated calls do not leak connections.
	            conn.close()
	    except sqlite3.OperationalError as e:
	        return f"Database error: {e}. Please check 'transactions' table in shop.db."
	    if row:
	        return f"Top product today: {row[0]} with ₹{row[1]:,.2f}"
	    return "No transactions found for today."


	def web_search_agent(query: str) -> str:
	    """Answer *query* from a SerpApi web search, falling back to the LLM.

	    The snippet of the first organic search result is summarised by
	    llm_agent. If the search fails, returns no usable snippet, or the
	    summarisation call fails, the raw query is sent to llm_agent instead.

	    Args:
	        query: The user's question, used as the search term.

	    Returns:
	        The LLM's summary of the top snippet, or its direct answer to *query*.

	    Raises:
	        Exception: Whatever llm_agent raises on the final fallback call.
	    """
	    import logging  # local import: the module does not import logging itself

	    log = logging.getLogger(__name__)
	    snippet = ""
	    try:
	        resp = requests.get(
	            "https://serpapi.com/search",
	            params={"q": query, "api_key": os.getenv("SERPAPI_KEY")},
	            timeout=10,  # without a timeout a stalled request blocks forever
	        )
	        resp.raise_for_status()
	        # "or [{}]" also covers a present-but-empty result list.
	        results = resp.json().get("organic_results") or [{}]
	        snippet = (results[0].get("snippet") or "").strip()
	    except (
	        requests.RequestException,
	        ValueError,
	        AttributeError,
	        TypeError,
	        LookupError,
	    ) as exc:
	        # Log only the exception type: request errors can embed the full URL,
	        # which contains the API key.
	        log.warning(
	            "Web search failed (%s); falling back to the LLM", type(exc).__name__
	        )
	    if snippet:
	        try:
	            return llm_agent(f"Summarize: {snippet}")
	        except Exception:
	            # Best effort, as before: a failed summary falls through to a
	            # direct answer, but the failure is now recorded.
	            log.exception("Summarising the search snippet failed; answering directly")
	    return llm_agent(query)


	def llm_agent(query: str) -> str:
	    """Ask the OpenAI chat model to answer *query* and return the reply text.

	    The request uses the "gpt-4o-mini" model at temperature 0.2 with a generic
	    helpful-assistant system prompt. Surrounding whitespace is stripped from
	    the first choice's message content.
	    """
	    conversation = [
	        {"role": "system", "content": "You are a helpful assistant."},
	        {"role": "user", "content": query},
	    ]
	    completion = openai.chat.completions.create(
	        model="gpt-4o-mini",
	        messages=conversation,
	        temperature=0.2,
	    )
	    reply = completion.choices[0].message.content
	    return reply.strip()


	def stt_agent(audio_path: str) -> str:
	    """Transcribe the audio file at *audio_path* with the "whisper-1" model.

	    The file is opened in binary mode and sent to the OpenAI transcription
	    endpoint; the returned text is stripped of surrounding whitespace.
	    """
	    with open(audio_path, "rb") as audio_file:
	        transcription = openai.audio.transcriptions.create(
	            file=audio_file,
	            model="whisper-1",
	        )
	    return transcription.text.strip()


	def tts_agent(text: str, lang: str = 'en') -> str:
	    """Synthesize *text* to speech with gTTS and return the saved file's path.

	    Args:
	        text: The text to speak.
	        lang: Language code passed to gTTS.

	    Returns:
	        The path of the written MP3 file.
	    """
	    # NOTE(review): the filename is fixed, so each call overwrites the file
	    # written by the previous one.
	    out_path = "response_audio.mp3"
	    gTTS(text=text, lang=lang).save(out_path)
	    return out_path

	# --- LangGraph State and Nodes ---
	class State(TypedDict):
	    """Dictionary passed between the graph nodes."""

	    # The user's question (typed, or transcribed from audio).
	    query: str
	    # The answer text written by the db, web or llm node.
	    result: str

	# Routing logic based on query

	def route_fn(state: State) -> str:
	    """Choose the worker node for a query by case-insensitive keyword match.

	    Routes are checked in order and the first match wins: revenue keywords
	    select "db", question words select "web", and anything else goes to "llm".
	    Keywords are matched as substrings of the lower-cased query.
	    """
	    text = state["query"].lower()
	    keyword_routes = (
	        ("db", ("max revenue", "revenue")),
	        ("web", ("who", "what", "when", "where")),
	    )
	    for target, keywords in keyword_routes:
	        for keyword in keywords:
	            if keyword in text:
	                return target
	    return "llm"

	# Node implementations

	def router_node(state: State) -> dict:
	    """Pass the incoming query through unchanged as a state update."""
	    query = state["query"]
	    return {"query": query}

	def db_node(state: State) -> dict:
	    """Answer the query with db_agent and store the answer under "result"."""
	    answer = db_agent(state["query"])
	    return {"result": answer}

	def web_node(state: State) -> dict:
	    """Answer the query with web_search_agent and store it under "result"."""
	    answer = web_search_agent(state["query"])
	    return {"result": answer}

	def llm_node(state: State) -> dict:
	    """Answer the query with llm_agent and store the answer under "result"."""
	    answer = llm_agent(state["query"])
	    return {"result": answer}

	# Build the LangGraph
	# Flow: START -> router -> (db | web | llm) -> END.
	# The conditional edges hang off the router node, so the router runs first
	# and route_fn then selects exactly one worker for the query.
	builder = StateGraph(State)
	builder.add_node("router", router_node)
	builder.add_node("db", db_node)
	builder.add_node("web", web_node)
	builder.add_node("llm", llm_node)
	builder.add_edge(START, "router")
	builder.add_conditional_edges(
	    "router",
	    route_fn,
	    {"db": "db", "web": "web", "llm": "llm"},
	)
	# Every worker ends the run once it has produced a result.
	builder.add_edge("db", END)
	builder.add_edge("web", END)
	builder.add_edge("llm", END)
	graph = builder.compile()

	# Handler integrates STT/TTS and graph execution
	def handle_query(audio_or_text: str):
	    """Answer a spoken or typed question.

	    Args:
	        audio_or_text: Path of a recorded audio file (.wav or .mp3, any case),
	            or the question text itself. None or blank input is tolerated.

	    Returns:
	        A (text, audio_path) pair, matching the two outputs the UI binds to
	        this handler. audio_path is the synthesized speech file when the
	        input was audio, and None otherwise.
	    """
	    prompt_message = "Please record or type a question first."
	    # The UI passes None when nothing was recorded; answer softly instead of
	    # raising AttributeError on None.endswith.
	    if not audio_or_text or not audio_or_text.strip():
	        return prompt_message, None
	    is_audio = audio_or_text.lower().endswith((".wav", ".mp3"))
	    query = stt_agent(audio_or_text) if is_audio else audio_or_text
	    # An empty transcription carries no question to route.
	    if not query or not query.strip():
	        return prompt_message, None
	    state = graph.invoke({"query": query})
	    response = state["result"]
	    # Always return two values: the click handler is wired to two outputs.
	    audio_path = tts_agent(response) if is_audio else None
	    return response, audio_path

	# --- Gradio UI ---
	# NOTE(review): the only input is a microphone Audio component, yet its label
	# mentions typing and the examples are plain text questions - confirm whether
	# a text input was intended.
	with gr.Blocks() as demo:
	    gr.Markdown("## Shop Voice-Box Assistant (Speech In/Out)")
	    inp = gr.Audio(
	        label="Speak or type your question or upload transactions.csv separately in root",
	        sources=["microphone"],
	        type="filepath",
	    )
	    out_text = gr.Textbox(label="Answer (text)")
	    out_audio = gr.Audio(label="Answer (speech)")
	    submit = gr.Button("Submit")
	    # Sample questions shown under the form.
	    sample_questions = [
	        ["What is the max revenue product today?"],
	        ["Who invented the light bulb?"],
	        ["Tell me a joke about cats."],
	    ]
	    gr.Examples(
	        examples=sample_questions,
	        inputs=inp,
	        outputs=[out_text, out_audio],
	    )
	    # Pressing Submit sends the recording to handle_query and fills both outputs.
	    submit.click(fn=handle_query, inputs=inp, outputs=[out_text, out_audio])

	if __name__ == "__main__":
	    # Serve on all interfaces at port 7860, without a public share link.
	    demo.launch(server_name="0.0.0.0", server_port=7860, share=False)