# Introduction to Machine Learning

This notebook walks through an example of a convolutional neural network (CNN) that recognizes handwritten digits (0–9) from the MNIST dataset.

Most of this code is adapted from the Keras example at https://keras.io/examples/vision/mnist_convnet/

## Setup

In [1]:
import numpy as np
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers

# Run on CPU only: expose an empty list of GPU devices to TensorFlow
tf.config.set_visible_devices(devices=[], device_type="GPU")

## Prepare the data

In [2]:
# Model / data parameters
num_classes = 10  # one class per digit
input_shape = (28, 28, 1)  # height, width, channels

# MNIST comes pre-split into a training set and a test set
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Convert pixels to float32 in the [0, 1] range, then append a trailing
# channel axis so every image has shape (28, 28, 1)
x_train = (x_train.astype("float32") / 255)[..., np.newaxis]
x_test = (x_test.astype("float32") / 255)[..., np.newaxis]

print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

# One-hot encode the integer class labels.
# Example with 4 classes (labels are 0-indexed):
# [0, 1, 2, 3] -> [[1, 0, 0, 0], [0, 1, 0, 0], [0, 0, 1, 0], [0, 0, 0, 1]]
y_train = keras.utils.to_categorical(y_train, num_classes=num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes=num_classes)


x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples


## Build the Model

In [3]:
# Layer stack for a small convolutional classifier. The shapes in the
# comments are the per-sample output shapes reported by model.summary().
cnn_layers = [
    keras.Input(shape=input_shape),
    # Two conv + max-pool stages extract spatial features
    layers.Conv2D(32, kernel_size=(3, 3), activation="relu"),  # (26, 26, 32)
    layers.MaxPooling2D(pool_size=(2, 2)),                     # (13, 13, 32)
    layers.Conv2D(64, kernel_size=(3, 3), activation="relu"),  # (11, 11, 64)
    layers.MaxPooling2D(pool_size=(2, 2)),                     # (5, 5, 64)
    # Classification head: flatten, regularize with dropout, then softmax
    layers.Flatten(),                                          # (1600,)
    layers.Dropout(0.5),
    layers.Dense(num_classes, activation="softmax"),           # (10,)
]

model = keras.Sequential(cnn_layers)

model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type) Output Shape Param # 
 conv2d (Conv2D) (None, 26, 26, 32) 320 
 
 max_pooling2d (MaxPooling2D (None, 13, 13, 32) 0 
 ) 
 
 conv2d_1 (Conv2D) (None, 11, 11, 64) 18496 
 
 max_pooling2d_1 (MaxPooling (None, 5, 5, 64) 0 
 2D) 
 
 flatten (Flatten) (None, 1600) 0 
 
 dropout (Dropout) (None, 1600) 0 
 
 dense (Dense) (None, 10) 16010 
 
Total params: 34,826
Trainable params: 34,826
Non-trainable params: 0
_________________________________________________________________


## Train the Model

In [4]:
# Training hyperparameters
batch_size = 128
epochs = 15

# Categorical cross-entropy pairs with the one-hot labels and the softmax
# output layer; accuracy is tracked as an additional metric.
model.compile(
    optimizer="adam",
    loss="categorical_crossentropy",
    metrics=["accuracy"],
)

In [5]:
# This cell can be run more than once, but fit() does not reset the model:
# each run continues training from the current weights, so repeated runs
# make overfitting increasingly likely.
# validation_split=0.1 holds out 10% of the training data for validation.

model.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=epochs,
    validation_split=0.1,
)

Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15




## Evaluate the Trained Model

In [6]:
# Evaluate on the held-out test set; with one compiled metric the result
# is [loss, accuracy].
score = model.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score
print("Test loss:", test_loss)
print("Test accuracy:", test_accuracy)

Test loss: 0.02596166729927063
Test accuracy: 0.9919000267982483


## Save Model (h5 format)

In [13]:
# Persist the trained model to a single file; the .h5 extension selects
# the HDF5 format.
model.save(filepath="mnist.h5")