mnist / app.py
alibayram's picture
Refactor prediction function: update data logging, reshape input handling, and simplify sketchpad configuration
fec34a0
raw
history blame
1.63 kB
import numpy as np
import gradio as gr
import tensorflow as tf
# App title
title = "Welcome to your first sketch recognition app!"
# App description
head = (
"<center>"
"<img src='./mnist-classes.png' width=400>"
"<p>The model is trained to classify numbers (from 0 to 9). "
"To test it, draw your number in the space provided.</p>"
"</center>"
)
# GitHub repository link
ref = "Find the complete code [here](https://github.com/ovh/ai-training-examples/tree/main/apps/gradio/sketch-recognition)."
# Image size: 28x28
img_size = 28
# Class names (from 0 to 9)
labels = ["zero", "one", "two", "three", "four", "five", "six", "seven", "eight", "nine"]
# Load model (trained on MNIST dataset)
model = tf.keras.models.load_model("./sketch_recognition_numbers_model.h5")
# Prediction function for sketch recognition
def predict(data):
print(data.shape)
# Reshape image to 28x28
img = np.reshape(data['composite'], (1, img_size, img_size, 1))
# Make prediction
pred = model.predict(img)
# Get top class
top_3_classes = np.argsort(pred[0])[-3:][::-1]
# Get top 3 probabilities
top_3_probs = pred[0][top_3_classes]
# Get class names
class_names = [labels[i] for i in top_3_classes]
# Return class names and probabilities
return {class_names[i]: top_3_probs[i] for i in range(3)}
# Top 3 classes
label = gr.Label(num_top_classes=3)
# Open Gradio interface for sketch recognition
interface = gr.Interface(
fn=predict,
inputs=gr.Sketchpad(type='numpy'),
outputs=label,
title=title,
description=head,
article=ref
)
interface.launch()