import matplotlib.pyplot as plt
import numpy as np
import random
import requests

from io import BytesIO
from PIL import Image, ImageEnhance, ImageOps
from tensorflow.keras.datasets import mnist
from tensorflow.keras import models, layers


# Load the MNIST dataset; load_data() returns an (images, labels) pair for the
# training split and another for the test split, unpacked here into four arrays
(train_images, train_labels), (test_images, test_labels) = mnist.load_data()


# Print the shape of the entire training dataset
# (number of images, rows per image, columns per image)
print("Train dataset: ", train_images.shape)

# Print the container type that holds the image data
print(type(train_images))

Train dataset:  (60000, 28, 28)
<class 'numpy.ndarray'>


# Print the shape of the entire test dataset
# (number of images, rows per image, columns per image)
print("Test dataset: ", test_images.shape)

Test dataset:  (10000, 28, 28)


# Show rows 12, 13 and 14 of the first training image as raw pixel
# intensities (0 = black, 255 = white)
print("Three rows from the first image:")
first_image = train_images[0]
for row_index in range(12, 15):
    print(first_image[row_index])

Three rows from the first image:
[  0   0   0   0   0   0   0   0   0   0   0  11 190 253  70   0   0   0
   0   0   0   0   0   0   0   0   0   0]
[  0   0   0   0   0   0   0   0   0   0   0   0  35 241 225 160 108   1
   0   0   0   0   0   0   0   0   0   0]
[  0   0   0   0   0   0   0   0   0   0   0   0   0  81 240 253 253 119
  25   0   0   0   0   0   0   0   0   0]


# Set the default figure size for the plots (8x3 inches)
plt.rcParams["figure.figsize"] = (8, 3)

# Display 12 randomly chosen images from the training dataset in a 2x6 grid
for i in range(12):

    # Create a subplot for each image (i+1 is the 1-based position in the grid)
    plt.subplot(2, 6, i+1)

    # Randomly select a valid image index. randrange() excludes the upper
    # bound, whereas randint(0, len(train_images)) includes it and could
    # therefore pick an index one past the last image (IndexError).
    num = random.randrange(len(train_images))

    # Display the image in grayscale, without interpolating between pixels
    plt.imshow(train_images[num], cmap="gray", interpolation="none")

    # Use the image's label as the title of its subplot
    plt.title("Number {}".format(train_labels[num]))

# Adjust the spacing between the subplots
plt.tight_layout()


# Add a trailing channel axis of size 1 (the depth of a grayscale image).
# -1 lets NumPy infer the number of images instead of hard-coding the
# 60000/10000 split sizes, so this also works on a subset of the data and
# is harmless if the cell is executed again.
train_images = train_images.reshape((-1, 28, 28, 1))
test_images = test_images.reshape((-1, 28, 28, 1))


# Normalize pixel values from the 0-255 range to between 0 and 1
train_images = train_images.astype("float32") / 255
test_images = test_images.astype("float32") / 255


# Build the CNN as one Sequential stack: three convolutional layers (the
# first two each followed by 2x2 max pooling) and a small dense classifier
model = models.Sequential([
    # Convolutional part; the input is a 28x28 image with a single channel
    layers.Conv2D(32, (3, 3), activation="relu", input_shape=(28, 28, 1)),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation="relu"),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation="relu"),
    # Flatten the feature maps into a vector for the dense layers
    layers.Flatten(),
    # Fully connected layer, then a 10-unit softmax output (one unit per digit)
    layers.Dense(64, activation="relu"),
    layers.Dense(10, activation="softmax"),
])


# Configure training: Adam optimizer, accuracy as the reported metric, and the
# sparse variant of categorical cross-entropy, since the labels are passed to
# fit() as loaded (this script never one-hot encodes them; presumably they are
# integer class ids 0-9)
model.compile(
    optimizer="adam",
    loss="sparse_categorical_crossentropy",
    metrics=["accuracy"]
)


# Train for 5 passes over the training set in mini-batches of 64 images
model.fit(train_images, train_labels, epochs=5, batch_size=64)

Epoch 1/5
938/938 [==============================] - 45s 47ms/step - loss: 0.1765 - accuracy: 0.9465
Epoch 2/5
938/938 [==============================] - 54s 57ms/step - loss: 0.0487 - accuracy: 0.9848
Epoch 3/5
938/938 [==============================] - 45s 48ms/step - loss: 0.0352 - accuracy: 0.9886
Epoch 4/5
938/938 [==============================] - 45s 48ms/step - loss: 0.0276 - accuracy: 0.9910
Epoch 5/5
938/938 [==============================] - 45s 48ms/step - loss: 0.0218 - accuracy: 0.9925

<keras.src.callbacks.History at 0x78eedb0a5c90>


# Evaluate the trained model on the test set; the result is unpacked into the
# loss and the accuracy metric that was requested in model.compile()
test_loss, test_acc = model.evaluate(test_images, test_labels)

# Print the accuracy (a fraction between 0 and 1) as a percentage
print(f"\nTest accuracy: {test_acc * 100}%")

313/313 [==============================] - 3s 8ms/step - loss: 0.0305 - accuracy: 0.9911

Test accuracy: 99.1100013256073%


# Set URL of a PNG image
image_url = "https://raw.githubusercontent.com/pesout/digit-classifier/main/number_gallery/number4.png"


# Download the image. requests applies no timeout by default, so set one to
# avoid hanging indefinitely on an unresponsive server.
response = requests.get(image_url, timeout=30)

# Fail with a clear HTTP error (e.g. 404) instead of handing an error page
# to the image decoder
response.raise_for_status()

# Decode the downloaded bytes directly from memory
img = Image.open(BytesIO(response.content))


# Show the image exactly as it was downloaded
plt.imshow(img)
plt.title("Original Image")
plt.show()


# Normalize the color mode so the inversion below always operates on RGB
if img.mode != "RGB":
    img = img.convert("RGB")


# Invert the colors (presumably because the source image is dark-on-light,
# while the MNIST digits are light strokes on a black background)
img = ImageOps.invert(img)


# Show the result of the inversion
plt.imshow(img)
plt.title("Inverted Image")
plt.show()


# Shrink to the 28x28 input size of the model, then reduce the result to a
# single grayscale channel (mode "L")
img = img.resize((28, 28)).convert("L")


# Boost the contrast; adjust the factor to control how strong the effect is
contrast_enhancer = ImageEnhance.Contrast(img)
img = contrast_enhancer.enhance(4.0)


# Turn the PIL image into a NumPy array, scale the pixels to the 0-1 range
# and give it the model's input layout: (batch of 1, 28, 28, 1 channel)
img_array = (np.array(img) / 255.0).reshape(1, 28, 28, 1)


# Plot the single 28x28 image held in the array to check the preprocessing
plt.imshow(img_array[0, ..., 0], cmap="gray")
plt.title("Processed Image")
plt.show()


# Run the model on the single-image batch and keep the first (only) row,
# which holds one probability per digit class
probabilities = model.predict(img_array)[0]

# Report the probability of every digit class as a percentage
for digit, probability in enumerate(probabilities):
    print(f"Class {digit}: Probability {probability:.2%}")

1/1 [==============================] - 0s 135ms/step
Class 0: Probability 0.00%
Class 1: Probability 0.01%
Class 2: Probability 0.00%
Class 3: Probability 0.00%
Class 4: Probability 97.61%
Class 5: Probability 0.00%
Class 6: Probability 0.01%
Class 7: Probability 0.02%
Class 8: Probability 2.35%
Class 9: Probability 0.00%


# The predicted class is the index of the highest probability
print("Predicted Class:", np.argmax(probabilities))

Predicted Class: 4


# Save the trained model to a file (relative path, so it is written to the
# current working directory)
model.save("exported_model.h5") # You can also use the newer .keras format

Handwritten Digit Recognition with Convolutional Neural Networks¶

Importing libraries and modules¶

Training and testing a prediction model on the MNIST dataset¶

Loading and understanding the dimensions of the MNIST dataset¶

Visualizing the MNIST Dataset¶

Preprocessing the image data¶

Building the Convolutional Neural Network (CNN)¶

Compiling the CNN model¶

Training the CNN model¶

Evaluating the model¶

Predicting the class of an external image¶

Downloading and loading an external image¶

Image preprocessing (1): Color mode and inversion¶

Image preprocessing (2): Resizing, grayscale and contrast¶

Predicting the class¶

Export the model (optional)¶