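"""Streamlit app for Bulgarian search-query intent classification.

Loads a fine-tuned sequence-classification model from the Hugging Face Hub
and serves single-query and batch (CSV / XLSX / Parquet) inference.
Run locally with:

    streamlit run app.py
"""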
import json
import torch
import streamlit as st
import pandas as pd
from transformers import AutoModelForSequenceClassification, AutoTokenizer

# ==============================
# ⚙️ CONFIGURABLE PARAMETERS
# ==============================
MODEL_PATH = "dejanseo/bulgarian-search-query-intent-alpha"  # HF model repository
LABEL_MAP_PATH = "label_map.json"  # Must sit in the same directory as app.py
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"

# ==============================
# 📌 Load Model and Tokenizer
# ==============================
@st.cache_resource  # cache so the model loads once per process, not on every rerun
def load_inference_resources():
    # Load the label mapping from a local file
    with open(LABEL_MAP_PATH, "r") as f:
        label_map = json.load(f)

    # Convert ID keys from string to int for the id_to_label mapping
    id_to_label = {int(k): v for k, v in label_map["id_to_label"].items()}

    # Load the tokenizer and model from Hugging Face
    tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
    model = AutoModelForSequenceClassification.from_pretrained(MODEL_PATH)
    model.to(DEVICE)
    model.eval()  # Set model to evaluation mode

    return model, tokenizer, label_map["label_to_id"], id_to_label

# ==============================
# 📌 Inference Function
# ==============================
def predict_intent(query, model, tokenizer, id_to_label):
    """
    Predict the intent of a Bulgarian search query.
    """
    # Tokenize input text
    inputs = tokenizer(
        query,
        padding="max_length",
        truncation=True,
        max_length=128,
        return_tensors="pt"
    )

    # Move inputs to the same device as the model
    inputs = {k: v.to(DEVICE) for k, v in inputs.items()}

    # Inference without gradient tracking
    with torch.no_grad():
        outputs = model(**inputs)

    # Compute probabilities with softmax
    probabilities = torch.nn.functional.softmax(outputs.logits, dim=1)[0]

    # Identify the predicted class and its confidence
    predicted_class_id = torch.argmax(probabilities).item()
    predicted_intent = id_to_label[predicted_class_id]
    confidence = probabilities[predicted_class_id].item()

    # Build a dictionary with all intent scores, sorted by descending probability
    all_intents = {id_to_label[i]: prob.item() for i, prob in enumerate(probabilities)}
    sorted_intents = sorted(all_intents.items(), key=lambda x: x[1], reverse=True)

    return {
        "query": query,
        "predicted_intent": predicted_intent,
        "confidence": confidence,
        "all_scores": sorted_intents
    }
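
# Minimal usage sketch outside the Streamlit UI; the example query is illustrative:
#   model, tokenizer, label_to_id, id_to_label = load_inference_resources()
#   result = predict_intent("евтини полети до София", model, tokenizer, id_to_label)
#   print(result["predicted_intent"], result["confidence"])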

# ==============================
# 🌟 Streamlit UI for Inference
# ==============================
def inference_ui():
    st.title("🔍 Bulgarian Search Intent Classification")

    try:
        # Load resources
        model, tokenizer, label_to_id, id_to_label = load_inference_resources()
        st.success(f"✅ Model loaded successfully! Found {len(id_to_label)} intent classes.")

        # Show available intents
        with st.expander("Available Intent Classes"):
            st.write(", ".join(id_to_label.values()))

        # Single-query inference
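        # Default query translates to "How do I make a restaurant reservation?"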
        query = st.text_input("Enter a Bulgarian search query:", "Как да направя резервация за ресторант?")
        if st.button("Predict Intent"):
            with st.spinner("Analyzing query..."):
                prediction = predict_intent(query, model, tokenizer, id_to_label)

            st.subheader("Prediction Results")
            st.metric(
                label="Predicted Intent",
                value=prediction["predicted_intent"],
                delta=f"{prediction['confidence']*100:.2f}% confidence"
            )

            st.subheader("Intent Probabilities")
            df_probs = pd.DataFrame(prediction["all_scores"], columns=["Intent", "Probability"])

            # Chart only the top-5 intents to keep the bar chart readable
            df_top5 = df_probs.head(5)
            st.bar_chart(df_top5.set_index("Intent"))

            with st.expander("View All Intent Probabilities"):
                st.dataframe(df_probs)
        # Batch inference section
        st.subheader("Batch Inference")
        uploaded_file = st.file_uploader("Upload a CSV, Excel, or Parquet file with queries", type=["csv", "xlsx", "parquet"])

        if uploaded_file is not None:
            # Read the uploaded file according to its extension
            if uploaded_file.name.endswith(".csv"):
                df = pd.read_csv(uploaded_file)
            elif uploaded_file.name.endswith(".xlsx"):
                df = pd.read_excel(uploaded_file)
            elif uploaded_file.name.endswith(".parquet"):
                df = pd.read_parquet(uploaded_file)

            # Use the "query" column if present; otherwise let the user pick one
            query_column = "query" if "query" in df.columns else st.selectbox("Select the column containing queries:", df.columns)
            if query_column and st.button("Run Batch Inference"):
                progress_bar = st.progress(0)
                results = []

                # Classify each query, updating the progress bar as we go
                for i, row in enumerate(df[query_column]):
                    progress_bar.progress((i + 1) / len(df))
                    prediction = predict_intent(row, model, tokenizer, id_to_label)
                    results.append({
                        "query": row,
                        "predicted_intent": prediction["predicted_intent"],
                        "confidence": prediction["confidence"]
                    })

                results_df = pd.DataFrame(results)
                st.subheader("Batch Inference Results")
                st.dataframe(results_df)

                # Offer the results as a downloadable CSV
                csv = results_df.to_csv(index=False)
                st.download_button(
                    label="Download Results as CSV",
                    data=csv,
                    file_name="batch_inference_results.csv",
                    mime="text/csv"
                )

    except Exception as e:
        st.error(f"❌ Error loading model or running inference: {str(e)}")
        st.error("Please ensure the model and label map files are available.")


if __name__ == "__main__":
    inference_ui()