## Creation and training of the minst model

In [1]:
import numpy as np
from tensorflow import keras
from tensorflow.keras import layers

# Model / data parameters
num_classes = 10
input_shape = (28, 28, 1)

# the data, split between train and test sets
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Scale images to the [0, 1] range
x_train = x_train.astype("float32") / 255
x_test = x_test.astype("float32") / 255
# Make sure images have shape (28, 28, 1)
x_train = np.expand_dims(x_train, -1)
x_test = np.expand_dims(x_test, -1)
print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")


# convert class vectors to binary class matrices
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

model = keras.Sequential(
    [
        keras.Input(shape=input_shape),
        layers.Conv2D(32, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Conv2D(64, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Flatten(),
        layers.Dropout(0.5),
        layers.Dense(num_classes, activation="softmax"),
    ]
)

batch_size = 128
epochs = 15

model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])

model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)
score = model.evaluate(x_test, y_test, verbose=0)
print("Test loss:", score[0])
print("Test accuracy:", score[1])


x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples
Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15
Test loss: 0.025229280814528465
Test accuracy: 0.9909999966621399


In [8]:
from PIL import Image

In [12]:
y_pred = model.predict_classes(x_test)

In [39]:
#check the shape of the testing image 
x_test.shape

(10000, 28, 28, 1)

# Importing the images created from sudoku_solver.py in the img_r folder

In [58]:
img_path = "img_r/cell_{}_{}.jpg"
array_ret = []
for i in range(1,10,1):
    for j in range(1,10,1):
        img = Image.open(img_path.format(i,j)).convert("L")
        img = np.resize(img, (28,28,1))
        im2arr = np.array(img)
        im2arr = im2arr.reshape(1,28,28,1)
        if np.count_nonzero(im2arr) == 0:
            array_ret.append(0)
        else:
            array_ret.append(model.predict_classes(im2arr)[0])

## Array containg the sudoku (0 = empty cell) 

In [62]:
sudoku = np.array(array_ret)
sudoku = sudoku.reshape((9,9))
sudoku

array([[5, 3, 0, 0, 7, 0, 0, 0, 0],
       [6, 0, 0, 2, 9, 5, 0, 0, 0],
       [0, 9, 8, 0, 0, 0, 0, 8, 0],
       [8, 0, 0, 0, 6, 0, 0, 0, 3],
       [4, 0, 0, 8, 0, 3, 0, 0, 1],
       [7, 0, 0, 0, 2, 0, 0, 0, 5],
       [0, 6, 0, 0, 0, 0, 2, 8, 0],
       [0, 0, 0, 4, 1, 8, 0, 0, 5],
       [0, 0, 0, 0, 8, 0, 0, 7, 9]])