Spaces:

alibayram
/

mnist

Runtime error

App Files Community

alibayram committed on Dec 7, 2024

Commit

4c5bd22

1 Parent(s): 095137d

Refactor app.py: update app title and description, simplify label handling, and enhance prediction function

Browse files

Files changed (2) hide show

app.py +28 -77
requirements.txt +3 -3

app.py CHANGED Viewed

@@ -1,96 +1,47 @@
-import numpy as np
 import gradio as gr
 import tensorflow as tf
 import cv2
-# App title
-title = "Welcome to your first sketch recognition app!"
-# App description
 head = (
-    "<center>"
-    "<img src='./mnist-classes.png' width=400>"
-    "<p>The model is trained to classify numbers (from 0 to 9). "
-    "To test it, draw your number in the space provided.</p>"
-    "</center>"
 )
 # GitHub repository link
-ref = "Find the complete code [here](https://github.com/ovh/ai-training-examples/tree/main/apps/gradio/sketch-recognition)."
-# Class names (from 0 to 9)
-labels = {
-    0: "zero",
-    1: "one",
-    2: "two",
-    3: "three",
-    4: "four",
-    5: "five",
-    6: "six",
-    7: "seven",
-    8: "eight",
-    9: "nine"
-}
-# Load model (trained on MNIST dataset)
-model = tf.keras.models.load_model("./sketch_recognition_numbers_model.h5")
-def predict(data):
-    # Convert to NumPy array
-    img = np.array(data['composite'])
-    # print non-zero values
-    print("non-zero values", np.count_nonzero(img))
-    for i in range(img.shape[0]):
-        for j in range(img.shape[1]):
-            if img[i][j] > 0:
-                print(i, j, img[i][j])
-    print("img.shape", img.shape)
-    # Handle RGBA or RGB images
-    if img.shape[-1] == 4:  # RGBA
-        img = cv2.cvtColor(img, cv2.COLOR_RGBA2RGB)
-    if img.shape[-1] == 3:  # RGB
-        img = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
-    # Resize image to 28x28
-    img = cv2.resize(img, (28, 28))
-    # Normalize pixel values to [0, 1]
-    img = img / 255.0
-    # Reshape to match model input
-    img = img.reshape(1, 28, 28, 1)
-    print("img", img)
-    # Model predictions
-    preds = model.predict(img)[0]
-    print("preds", preds)
-    values_map = {preds[i]: i for i in range(len(preds))}
-    sorted_values = sorted(preds, reverse=True)
-    labels_map = dict()
-    for i in range(3):
-        print("sorted_values[i]", sorted_values[i], values_map[sorted_values[i]])
-        labels_map[labels[values_map[sorted_values[i]]]] = sorted_values[i]
-    print("labels_map", labels_map)
-    return labels_map
-# Top 3 classes
-label = gr.Label(num_top_classes=3)
-# Open Gradio interface for sketch recognition
-interface = gr.Interface(
-    fn=predict,
-    inputs=gr.Sketchpad(type='numpy', image_mode='L', brush=gr.Brush()),
-    outputs=label,
-    title=title,
-    description=head,
-    article=ref
-)
 interface.launch(share=True)

+# import dependencies
 import gradio as gr
 import tensorflow as tf
 import cv2
+# app title
+title = "Welcome on your first sketch recognition app!"
+# app description
 head = (
+  "<center>"
+  "<img src='file/mnist-classes.png' width=400>"
+  "The robot was trained to classify numbers (from 0 to 9). To test it, write your number in the space provided."
+  "</center>"
 )
 # GitHub repository link
+ref = "Find the whole code [here](https://github.com/ovh/ai-training-examples/tree/main/apps/gradio/sketch-recognition)."
+# image size: 28x28
+img_size = 28
+# classes name (from 0 to 9)
+labels = ["zero", "one", "two", "three", "four", "five", "six", "seven", "eight", "nine"]
+# load model (trained on MNIST dataset)
+model = tf.keras.models.load_model("model/sketch_recognition_numbers_model.h5")
+# prediction function for sketch recognition
+def predict(img):
+  # image shape: 28x28x1
+  img = cv2.resize(img, (img_size, img_size))
+  img = img.reshape(1, img_size, img_size, 1)
+  # model predictions
+  preds = model.predict(img)[0]
+  # return the probability for each classe
+  return {label: float(pred) for label, pred in zip(labels, preds)}
+# top 3 of classes
+label = gr.outputs.Label(num_top_classes=3)
+# open Gradio interface for sketch recognition
+interface = gr.Interface(fn=predict, inputs="sketchpad", outputs=label, title=title, description=head, article=ref)
 interface.launch(share=True)

requirements.txt CHANGED Viewed

@@ -1,3 +1,3 @@
-tensorflow
-opencv-python-headless
-numpy

+gradio==3.0.10
+tensorflow==2.9.1
+opencv-python-headless==4.6.0.66