Spaces:

arifdogan
/

invoice-ai-extractor

Sleeping

Add .idea config files, update README with detailed instructions, implement invoice extraction in app.py, and list dependencies in requirements.txt.

39e0658 verified 2 months ago

raw

history blame contribute delete

8.44 kB

	import csv
	import io
	import json
	import logging

	import fitz
	import streamlit as st
	import torch
	from PIL import Image, ImageGrab
	from transformers import pipeline

	# --- Configuration and Setup ---

	# Device argument handed to the transformers pipeline in load_model():
	# CUDA device 0 when a GPU is available, otherwise -1 (CPU).
	DEVICE = 0 if torch.cuda.is_available() else -1

	# Page-level settings. The title uses a plain "|" separator: the previous
	# "\|" was an invalid escape sequence that also left a literal backslash
	# in the browser tab title.
	st.set_page_config(
	    page_title="Invoice AI | by Arif Dogan",
	    page_icon="🧾",
	    layout="wide",
	    initial_sidebar_state="collapsed",
	)

	# --- Styling ---

	# Global CSS overrides injected once per run. The "high", "medium" and
	# "low" classes colour the confidence percentages rendered next to each
	# extracted field; the remaining rules restyle or hide stock Streamlit
	# elements.
	_CUSTOM_CSS = """
	<style>
	.stApp {max-width: 1200px; margin: 0 auto}
	.stButton>button {background-color: #4CAF50; color: white; border-radius: 5px;}
	.stProgress>div>div {background-color: #4CAF50}
	footer {visibility: hidden}
	.high {color: #4CAF50; font-weight: bold}
	.medium {color: #FFA726; font-weight: bold}
	.low {color: #EF5350; font-weight: bold}
	div[data-testid="stToolbar"] {visibility: hidden; height: 0}
	[data-testid="stExpanderContent"] {background-color: rgba(67, 76, 94, 0.5);}
	.stTextInput>div>div {background-color: rgba(67, 76, 94, 0.5)}
	</style>
	"""
	st.markdown(_CUSTOM_CSS, unsafe_allow_html=True)


	# --- Functions ---


	@st.cache_resource
	def load_model():
	    """Create the document question-answering pipeline used for extraction.

	    Decorated with ``st.cache_resource`` so the pipeline object is reused
	    rather than rebuilt each time the script runs.

	    Returns:
	        The ``transformers`` pipeline for the "document-question-answering"
	        task, backed by the "faisalraza/layoutlm-invoices" model and placed
	        on ``DEVICE``.
	    """
	    qa_pipeline = pipeline(
	        "document-question-answering",
	        model="faisalraza/layoutlm-invoices",
	        device=DEVICE,
	    )
	    return qa_pipeline


	def process_pdf(pdf_file, dpi=300):
	    """Render the first page of a PDF as a PIL image.

	    Only the first page is rasterized; the total page count is returned so
	    callers can tell whether more pages exist.

	    Args:
	        pdf_file: Binary file-like object; its remaining content is read
	            in full with ``read()``.
	        dpi: Rendering resolution. PDF coordinates are 72 units per inch,
	            so the zoom factor is ``dpi / 72``. Defaults to 300, the value
	            that was previously hard-coded.

	    Returns:
	        A ``(image, page_count)`` tuple, where ``image`` is the first page
	        decoded from its PNG rendering.

	    Raises:
	        ValueError: If the document contains no pages.
	        Exception: Anything raised by PyMuPDF or Pillow while opening or
	            rendering propagates unchanged.
	    """
	    pdf_bytes = pdf_file.read()

	    # PyMuPDF opens in-memory data directly, and the context manager closes
	    # the document even when rendering fails, so no wrapper stream or
	    # try/finally is needed.
	    with fitz.open(stream=pdf_bytes, filetype="pdf") as pdf_document:
	        page_count = pdf_document.page_count
	        if page_count < 1:
	            raise ValueError("PDF has no pages")

	        zoom = dpi / 72
	        pix = pdf_document[0].get_pixmap(matrix=fitz.Matrix(zoom, zoom))
	        png_bytes = pix.tobytes("png")

	    return Image.open(io.BytesIO(png_bytes)), page_count


	def process_image(uploaded_file):
	    """Turn an uploaded document into a PIL image plus a page count.

	    Args:
	        uploaded_file: File-like upload exposing ``seek()`` and a ``type``
	            attribute holding its MIME type.

	    Returns:
	        ``process_pdf(uploaded_file)`` for "application/pdf" uploads;
	        otherwise ``(Image.open(uploaded_file), 1)``.
	    """
	    # Rewind first: the same upload object may already have been read.
	    uploaded_file.seek(0)

	    is_pdf = uploaded_file.type == "application/pdf"
	    if not is_pdf:
	        return Image.open(uploaded_file), 1
	    return process_pdf(uploaded_file)


	def get_clipboard_image():
	    """Best-effort fetch of an image from the clipboard.

	    Returns:
	        ``(image, 1)`` when the clipboard holds a PIL image, otherwise
	        ``(None, 0)``. Any error raised while reading the clipboard is
	        treated as "no image" rather than propagated.
	    """
	    # NOTE(review): ImageGrab runs in this Python process, so this reads
	    # the clipboard of the machine hosting the app, presumably not the
	    # browser user's clipboard. Confirm this is intended.
	    grabbed = None
	    try:
	        candidate = ImageGrab.grabclipboard()
	        # Anything that is not a PIL image (e.g. None) counts as no image.
	        if isinstance(candidate, Image.Image):
	            grabbed = candidate
	    except Exception:
	        grabbed = None

	    if grabbed is None:
	        return None, 0
	    return grabbed, 1


	def prepare_export_data(extracted_info, format_type):
	    """Serialize the extracted field values for download.

	    Only each field's ``"value"`` is exported; confidences are dropped.

	    Args:
	        extracted_info: Mapping of field name to a dict with a ``"value"``
	            key, as produced by ``extract_information``.
	        format_type: ``"JSON"`` or ``"CSV"``; any other value produces the
	            plain-text format.

	    Returns:
	        A string: a JSON object indented by two spaces, a two-line CSV
	        (header row, then one row of quoted values, no trailing newline),
	        or one ``field: value`` line per field.
	    """
	    values_by_field = {
	        field: data["value"] for field, data in extracted_info.items()
	    }

	    if format_type == "JSON":
	        return json.dumps(values_by_field, indent=2)

	    if format_type == "CSV":
	        # Use the csv module so embedded double quotes are escaped (and a
	        # header containing a comma gets quoted). The previous hand-rolled
	        # join emitted such values verbatim, producing a malformed row.
	        buffer = io.StringIO()
	        csv.writer(buffer, lineterminator="\n").writerow(values_by_field)
	        csv.writer(buffer, quoting=csv.QUOTE_ALL, lineterminator="\n").writerow(
	            [str(value) for value in values_by_field.values()]
	        )
	        # Drop only the final row terminator to keep the old output shape.
	        return buffer.getvalue()[:-1]

	    # Plain-text fallback ("TXT").
	    return "\n".join(
	        f"{field}: {value}" for field, value in values_by_field.items()
	    )


	def extract_information(
	    model, image, questions, progress_bar, status_text, min_confidence=0.1
	):
	    """Ask the model each question about the image and collect the answers.

	    Args:
	        model: Callable invoked as ``model(image=..., question=...)``. Its
	            result is expected to be a sequence whose first item is a dict
	            with ``"answer"`` and ``"score"`` keys.
	        image: The document image passed through to ``model``.
	        questions: Sized sequence of question strings.
	        progress_bar: Object with a ``progress(fraction)`` method, updated
	            before each question is asked.
	        status_text: Object with a ``text(message)`` method, updated before
	            each question is asked.
	        min_confidence: Answers are kept only when their score is strictly
	            greater than this value. Defaults to 0.1, the threshold that
	            was previously hard-coded.

	    Returns:
	        Dict mapping a field name derived from the question (for example
	        "What is the invoice number?" becomes "Invoice Number") to
	        ``{"value": answer, "confidence": score}``. Questions with an empty
	        answer, a low score, or a processing error are omitted.
	    """
	    logger = logging.getLogger(__name__)
	    total = len(questions)
	    extracted_info = {}

	    for position, question in enumerate(questions, start=1):
	        try:
	            progress_bar.progress(position / total)
	            status_text.text(f"Processing: {question} ({position}/{total})")

	            response = model(image=image, question=question)
	            top = response[0] if response else None
	            answer = top.get("answer", "") if top else ""
	            # Blank or whitespace-only answers count as "not found".
	            if not answer.strip():
	                continue
	            confidence = top["score"]
	        except Exception:
	            # Best effort: one failing question must not abort the others,
	            # but leave a trace instead of discarding the error silently.
	            logger.warning(
	                "Extraction failed for question %r", question, exc_info=True
	            )
	            continue

	        if confidence > min_confidence:
	            field = question.replace("What is the ", "").replace("?", "").title()
	            extracted_info[field] = {"value": answer, "confidence": confidence}

	    return extracted_info


	# --- Initialization ---

	# Seed the per-session keys on the first run so the code below can read
	# them unconditionally; values already present are left untouched.
	for _state_key, _initial_value in (
	    ("processed_image", None),
	    ("extracted_info", {}),
	):
	    if _state_key not in st.session_state:
	        st.session_state[_state_key] = _initial_value

	# --- UI Layout ---

	# Centered page header.
	_HEADER_HTML = """
	<div style='text-align: center; padding: 1rem;'>
	<h1>🧾 Invoice AI Extractor</h1>
	<p style='font-size: 1.2em; color: #999;'>Powered by LayoutLM</p>
	</div>
	"""
	st.markdown(_HEADER_HTML, unsafe_allow_html=True)

	model = load_model()

	# Two input routes side by side: a file uploader (wider column) and a
	# button that triggers a clipboard check.
	upload_col, clipboard_col = st.columns([2, 1])

	with upload_col:
	    uploaded_file = st.file_uploader(
	        "Drop invoice (PDF, JPG, PNG)",
	        type=["pdf", "jpg", "jpeg", "png"],
	    )

	with clipboard_col:
	    st.write("Or paste from clipboard (Ctrl/Cmd + V)")
	    check_clipboard = st.button("📎 Check Clipboard")

	# --- Image Processing Logic ---

	# Streamlit re-executes this script on every widget interaction, and the
	# uploader keeps returning the same file until the user removes it. Track
	# which upload was processed last so results are reset only for a new
	# file; resetting on every rerun forced a full re-extraction each time any
	# widget (e.g. the export format selector) changed.
	if uploaded_file:
	    upload_key = getattr(
	        uploaded_file, "file_id", (uploaded_file.name, uploaded_file.size)
	    )
	    if st.session_state.get("last_upload_key") != upload_key:
	        try:
	            image, _ = process_image(uploaded_file)
	        except Exception as e:
	            # The key is left unset so the error keeps showing on reruns
	            # while the unreadable file stays in the uploader.
	            st.error(f"Error processing file: {e}")
	        else:
	            st.session_state.processed_image = image
	            st.session_state.extracted_info = {}  # Reset on new upload
	            st.session_state.last_upload_key = upload_key

	elif check_clipboard:
	    clipboard_image, _ = get_clipboard_image()
	    if clipboard_image:
	        st.session_state.processed_image = clipboard_image
	        st.session_state.extracted_info = {}
	        # Forget the last upload so re-uploading that file is handled as new.
	        st.session_state.last_upload_key = None
	        st.success("Image loaded from clipboard")
	    else:
	        st.warning("No image found in clipboard")

	# --- Display and Information Extraction ---

	# Show the current document next to the extracted fields and offer the
	# results for download. Any failure in this section is reported in the
	# page instead of stopping the script.
	if st.session_state.processed_image is not None:
	    try:
	        image = st.session_state.processed_image.convert("RGB")

	        col1, col2 = st.columns([1, 1])

	        with col1:
	            st.image(image, caption="Document", use_container_width=True)

	        with col2:
	            st.markdown("### 📊 Extracted Information")

	            # Query the model only when there are no stored results for the
	            # current document.
	            if not st.session_state.extracted_info:
	                questions = [
	                    "What is the invoice number?",
	                    "What is the invoice date?",
	                    "What is the total amount?",
	                    "What is the company name?",
	                    "What is the due date?",
	                    "What is the tax amount?",
	                ]

	                # Progress bar and status line updated by extract_information.
	                progress_bar = st.progress(0)
	                status_text = st.empty()

	                st.session_state.extracted_info = extract_information(
	                    model, image, questions, progress_bar, status_text
	                )

	                # Clear status text after completion
	                status_text.empty()

	            if st.session_state.extracted_info:
	                for field, data in st.session_state.extracted_info.items():
	                    conf_col, val_col = st.columns([1, 4])
	                    with val_col:
	                        # An explicit key keeps the widgets distinct per field.
	                        st.text_input(
	                            field,
	                            data["value"],
	                            disabled=True,
	                            key=f"input_{field}",
	                        )
	                    with conf_col:
	                        confidence = data["confidence"]
	                        # Pick the CSS class that colours the percentage.
	                        if confidence > 0.7:
	                            css_class = "high"
	                        elif confidence > 0.4:
	                            css_class = "medium"
	                        else:
	                            css_class = "low"
	                        st.markdown(
	                            f"<p class='{css_class}'>{confidence:.1%}</p>",
	                            unsafe_allow_html=True,
	                        )

	                st.markdown("### 📥 Export")
	                export_format = st.selectbox("Format", ["JSON", "CSV", "TXT"])
	                export_data = prepare_export_data(
	                    st.session_state.extracted_info, export_format
	                )
	                file_extension = export_format.lower()
	                # Map each format to its registered media type; deriving it
	                # as f"text/{extension}" produced the invalid "text/json"
	                # and "text/txt".
	                mime_types = {
	                    "JSON": "application/json",
	                    "CSV": "text/csv",
	                    "TXT": "text/plain",
	                }
	                st.download_button(
	                    "Download",
	                    export_data,
	                    file_name=f"invoice_data.{file_extension}",
	                    mime=mime_types[export_format],
	                )
	            else:
	                st.warning(
	                    "Could not extract information. Please ensure the document is clear."
	                )

	    except Exception as e:
	        st.error(f"Error during processing: {e}")

	# --- Footer ---

	# Footer: a horizontal rule followed by author links. The separator
	# between the links is a plain "|"; the previous "\|" was an invalid
	# escape sequence that also rendered a stray backslash.
	st.markdown("---")
	_FOOTER_HTML = """
	<div style='text-align: center'>
	<p>Created by <a href='https://github.com/doganarif' target='_blank'>Arif Dogan</a> |
	<a href='https://huggingface.co/arifdogan' target='_blank'>🤗 Hugging Face</a></p>
	</div>
	"""
	st.markdown(_FOOTER_HTML, unsafe_allow_html=True)