In [38]:
import os
import cv2
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras import callbacks
from tensorflow.keras.models import Model
from tensorflow.keras.models import load_model

from sklearn.model_selection import train_test_split

import matplotlib.pyplot as plt
%matplotlib inline

In [39]:
print(len(os.listdir("samples")))

1071


In [40]:
import string 

symbols = string.ascii_lowercase + "0123456789"

num_symbols = len(symbols)
img_shape = (50, 200 , 1)

print(num_symbols)

36


In [41]:
def preprocess_data():
    n_samples = len(os.listdir('samples/samples'))
    X = np.zeros((n_samples, 50, 200, 1)) #1071*50*200
    y = np.zeros((5, n_samples, num_symbols)) #5*1070*36
    
    for i, pic in enumerate(os.listdir('samples/samples')):
        img = cv2.imread(os.path.join('samples/samples', pic), cv2.IMREAD_GRAYSCALE)
        pic_target = pic[:-4]
        if len(pic_target) < 6:
            img = img /255.0
            img = np.reshape(img, (50, 200 ,1))
            
            targs = np.zeros((5, num_symbols))
            for j, l in enumerate(pic_target):
                ind = symbols.find(l)
                targs[j, ind] = 1
            X[i] = img
            y[:, i] = targs
            
    return X, y

X, y = preprocess_data()
X_train, y_train = X[:970], y[:, :970]
X_test, y_test = X[970:], y[:, 970:]
        

In [42]:
def create_model():
    img = layers.Input(shape = img_shape)
    
    conv1 = tf.keras.layers.Conv2D(16, (3, 3), padding = 'same', activation = 'relu')(img)
    maxpool1 = tf.keras.layers.MaxPooling2D(padding = 'same')(conv1)
    
    conv2 = tf.keras.layers.Conv2D(32, (3, 3), padding = 'same', activation = 'relu')(maxpool1)
    maxpool2 = tf.keras.layers.MaxPooling2D(padding = 'same')(conv2)
    
    conv3 = tf.keras.layers.Conv2D(32, (3, 3), padding = 'same', activation = 'relu')(maxpool2)
    batch_norm = tf.keras.layers.BatchNormalization()(conv3)
    maxpool3 = tf.keras.layers.MaxPooling2D(padding = 'same')(batch_norm)
    
    flat = tf.keras.layers.Flatten()(maxpool3)
    outs = []
    for _ in range(5):
        dense1 = tf.keras.layers.Dense(64, activation = 'relu')(flat)
        dropout = tf.keras.layers.Dropout(0.5)(dense1)
        dense2 = layers.Dense(num_symbols, activation = 'sigmoid')(dropout)
        
        outs.append(dense2)
        
    model = Model(img, outs)
    model.compile(loss = 'categorical_crossentropy', optimizer = 'adam', metrics = ['accuracy'])
    return model

In [43]:
model = create_model()
model.summary()

Model: "model_3"
__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_5 (InputLayer)            [(None, 50, 200, 1)] 0                                            
__________________________________________________________________________________________________
conv2d_12 (Conv2D)              (None, 50, 200, 16)  160         input_5[0][0]                    
__________________________________________________________________________________________________
max_pooling2d_12 (MaxPooling2D) (None, 25, 100, 16)  0           conv2d_12[0][0]                  
__________________________________________________________________________________________________
conv2d_13 (Conv2D)              (None, 25, 100, 32)  4640        max_pooling2d_12[0][0]           
____________________________________________________________________________________________

In [44]:
hist = model.fit(X_train, [y_train[0], y_train[1], y_train[2], y_train[3], y_train[4]], batch_size = 32, epochs = 30, verbose = 1, validation_split = 0.2)

Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30


Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30


Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


In [45]:
def predict(filepath):
    img = cv2.imread(filepath, cv2.IMREAD_GRAYSCALE)
    if img is not None:
        img = img / 255.0
    else:
        print("Image not Detected")
    res = np.array(model.predict(img[np.newaxis, :, :, np.newaxis]))
    ans = np.reshape(res, (5, 36))
    l_ind = []
    probs = []
    for a in ans:
        l_ind.append(np.argmax(a))
        
    capt = ''
    for l in l_ind:
        capt +=symbols[l]
        
    return capt


In [46]:
score = model.evaluate(X_test, [y_test[0], y_test[1], y_test[2], y_test[3], y_test[4]], verbose = 1)
print('Test Loss and accuracy: ', score)

Test Loss and accuracy:  [17.372095108032227, 15.740581512451172, 0.19774363934993744, 0.6200811862945557, 0.5850576162338257, 0.22863321006298065, 0.0, 0.9100000262260437, 0.8600000143051147, 0.8199999928474426, 0.9300000071525574]


In [47]:
model.evaluate(X_test, [y_test[0], y_test[1], y_test[2], y_test[3], y_test[4]])
print(predict('samples/samples/8n5p3.png'))
print(predict('samples/samples/f2m8n.png'))
print(predict('samples/samples/dce8y.png'))
print(predict('samples/samples/3eny7.png'))
print(predict('samples/samples/npxb7.png'))

8n5p3
f2m8n
dce8y
3eny7
mpxf7
