# handwriting

[![Open in Colab](https://img.shields.io/badge/Open%20in%20Colab-%23F9AB00.svg?logo=googlecolab&logoColor=white)](https://colab.research.google.com/github/tstaerk/handwriting/blob/main/jupyter-notebook/handwriting.ipynb)

A Jupyter notebook that trains a small neural network on the MNIST dataset to recognize handwritten digits.



In [2]:
import os
os.environ["CUDA_VISIBLE_DEVICES"] = "-1"  # Disable GPU

import numpy as np
import matplotlib.pyplot as plt
from tensorflow.keras.datasets import mnist
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Flatten
from tensorflow.keras.utils import to_categorical


In [None]:
# Load the MNIST dataset as (images, labels) pairs for the train and test splits
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Print the array shapes of the training and test images
print("Training data shape:", x_train.shape)
print("Testing data shape:", x_test.shape)

# Optional: visualize the first four training examples with their labels.
# Disabled by default; uncomment the loop below to display them.
#for i in range(4):
#  plt.imshow(x_train[i], cmap='gray')
#  plt.title(f"Label: {y_train[i]}")
#  plt.colorbar()
#  plt.show()


In [None]:
# Scale the pixel values of both image sets into the range [0, 1]
x_train, x_test = x_train / 255.0, x_test / 255.0

# Replace the integer labels with one-hot vectors over 10 classes
y_train, y_test = (
    to_categorical(labels, 10) for labels in (y_train, y_test)
)


In [None]:
# Build the model

from tensorflow.keras import Input

# Assemble the network one layer at a time
model = Sequential()
model.add(Input(shape=(28, 28)))            # Explicit 28x28 input
model.add(Flatten())                        # Unroll each image into a vector
model.add(Dense(128, activation='relu'))    # Hidden layer with 128 neurons
model.add(Dense(10, activation='softmax'))  # Output layer with 10 classes

# Configure training: Adam optimizer, categorical cross-entropy loss,
# accuracy reported as the metric
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

# Print the layer-by-layer summary
model.summary()


In [None]:
# Fit for 5 epochs, holding out 20% of the training data for validation
history = model.fit(
    x_train,
    y_train,
    validation_split=0.2,
    epochs=5,
)

# Plot training and validation accuracy recorded for each epoch
plt.xlabel('Epochs')
plt.ylabel('Accuracy')
plt.plot(history.history['accuracy'], label='Training Accuracy')
plt.plot(history.history['val_accuracy'], label='Validation Accuracy')
plt.legend()
plt.show()


In [None]:
from tensorflow.keras.utils import to_categorical

# Reload MNIST from scratch for the second training run
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Normalize pixel values to the range [0, 1].
# Reloading discards the scaling applied earlier in the notebook, and the
# custom-image cell further down feeds the model inputs divided by 255, so the
# training and test images must be put on the same scale here.
x_train = x_train / 255.0
x_test = x_test / 255.0

# Convert labels to one-hot encoding
y_train = to_categorical(y_train, num_classes=10)
y_test = to_categorical(y_test, num_classes=10)

# Check shapes
print("x_train shape:", x_train.shape)  # Should be (60000, 28, 28)
print("y_train shape:", y_train.shape)  # Should be (60000, 10)


In [None]:
# Report the shapes of the training images and labels
print("x_train shape:", x_train.shape)
print("y_train shape:", y_train.shape)

# Fail fast when either array holds no elements
if not (x_train.size and y_train.size):
    raise ValueError("Training data or labels are empty!")

# Rank checks: images must be 3-D, one-hot labels must be 2-D
assert x_train.ndim == 3, "x_train should have shape (num_samples, 28, 28)"
assert y_train.ndim == 2, "y_train should have shape (num_samples, num_classes)"


In [None]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Flatten, Dense, Input

# Create a fresh model, replacing whatever `model` referred to before,
# and add its layers in order
model = Sequential()
model.add(Input(shape=(28, 28)))            # Input matches one 28x28 image
model.add(Flatten())                        # Flatten the 28x28 images
model.add(Dense(128, activation='relu'))    # Hidden layer
model.add(Dense(10, activation='softmax'))  # One output per one-hot class

# Configure training: Adam optimizer, categorical cross-entropy loss,
# accuracy reported as the metric
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

# Print model summary
model.summary()


In [None]:
# Train for 5 epochs, holding out 20% of the training data for validation;
# the returned history object replaces the one from any earlier run
history = model.fit(
    x_train,
    y_train,
    validation_split=0.2,
    epochs=5,
)


In [None]:
# Evaluate on the test set; the result is unpacked as the loss followed by
# the accuracy metric the model was compiled with
test_loss, test_acc = model.evaluate(x_test, y_test)
# Report the accuracy as a percentage with two decimal places
print(f"Test Accuracy: {test_acc * 100:.2f}%")


In [None]:
# Run the model over every test image; each row of `predictions` holds the
# 10 softmax outputs for one image
predictions = model.predict(x_test)

# Visualize a single test example and compare the prediction with its label.
# argmax turns the softmax row (prediction) and the one-hot row (label) back
# into a digit.
index =8  # Change this index to test different images
plt.imshow(x_test[index], cmap='gray')
plt.title(f"Predicted: {np.argmax(predictions[index])}, Actual: {np.argmax(y_test[index])}")
plt.show()


In [None]:
# Save the trained model to "handwriting_model.h5" in the working directory.
# NOTE(review): the ".h5" extension selects the HDF5 format, which recent
# Keras releases reportedly treat as legacy in favor of ".keras" — confirm,
# and check whether other code loads this file name before changing it.
model.save("handwriting_model.h5")


In [None]:
from PIL import Image

# Read the custom image, convert it to grayscale and resize it to 28x28 pixels
img = Image.open('digit.png').convert('L').resize((28, 28))

# Scale the pixels by 1/255 and add a leading batch axis of size 1 so the
# array has the (1, 28, 28) shape passed to predict()
img_array = (np.array(img) / 255.0).reshape(1, 28, 28)

# NOTE(review): presumably the MNIST training digits are light strokes on a
# dark background; a dark-on-light scan may need inverting first — verify.

# Classify the image and print the highest-scoring class
prediction = model.predict(img_array)
print(f"Predicted Digit: {np.argmax(prediction)}")

# Display the resized grayscale image that was fed to the model
plt.imshow(img, cmap='gray')
plt.title("Your Handwritten Digit")
plt.show()
