# Hand sign classification
### The method of fragmentation

The image is divided into blocks of 20x20. In each block, we calculate the area of contour lying in that block and divide it by the area of that block. If there is no contour, the area is simply zero.

This calculation is performed 400 times and we get 400 features for a single image. 

These features are now trained using the classifiers:
* Deep Learning Neural Network
* KNN

### Fetching data from file

In [21]:
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.cm as cm
import numpy as np
from sklearn.model_selection import train_test_split as tts
from sklearn.metrics import confusion_matrix

data = pd.read_csv('new_data.csv')
print('Total data parsed: %d'%(len(data)))

no_of_classes = 36
label_indexes = {}
for i in range(10): label_indexes[i] = str(i)
for i in range(26):
    if not chr(ord('a')+i) in ['h','j','v']: label_indexes[10+i] = chr(ord('a')+i)

Total data parsed: 19599


### Deep Learning Neural Network model

In [20]:
from keras.models import Sequential
from keras.layers import Dense, Dropout
from sklearn.preprocessing import LabelEncoder
from sklearn.pipeline import Pipeline
from keras.utils import np_utils
from random import randint

X = data[['f'+str(i) for i in range(400)]].values.tolist()
Y = data['label'].values.tolist()

r_val = randint(1,1000)
print('Random state: %d'%(r_val))
X_train, X_test, Y_train, Y_test = tts(X,Y,test_size=0.3,random_state=r_val)
# 100
encoder = LabelEncoder()
encoder.fit(Y_train)
encoded_train_labels = encoder.transform(Y_train)
dummy_train_labels = np_utils.to_categorical(encoded_train_labels)

encoder = LabelEncoder()
encoder.fit(Y_test)
encoded_test_labels = encoder.transform(Y_test)
dummy_test_labels = np_utils.to_categorical(encoded_test_labels)

model = Sequential()
model.add(Dense(1000, input_dim=400, activation='relu', name='h1'))
model.add(Dense(500, activation='relu', name='h3'))
model.add(Dense(33, activation='softmax', name='op'))

model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
model.fit(X_train,dummy_train_labels,epochs=7,batch_size=32,verbose=1,validation_split=0.3)

score = model.evaluate(X_test,dummy_test_labels)
print("\n%s: %.2f%%" % (model.metrics_names[1], score[1]*100))

Using TensorFlow backend.


Random state: 745
Train on 9603 samples, validate on 4116 samples
Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7

acc: 98.50%


### KNN classifier

In [19]:
from sklearn.neighbors import KNeighborsClassifier
from random import randint
from sklearn.model_selection import KFold

X = data[['f'+str(i) for i in range(400)]].values
Y = data['label'].values

r_val = randint(1,1000)
print('Random state = %3d'%(r_val))
X_train, X_test, Y_train, Y_test = tts(X,Y,test_size=0.3, random_state=351)

print('Training...',end='\r')
classifier = KNeighborsClassifier(n_neighbors=3)
classifier.fit(X_train, Y_train)

print('Testing....',end='\r')
acc = classifier.score(X_test,Y_test)
print('Accuracy: %.3f%' % (acc*100))
print('Approximate incorrect samples: %d/%d'%((1-acc)*len(X_test),len(X_test)))

Random state = 313
Accuracy: 99.303%
Approximate incorrect samples: 40/5880


### Random Forest

In [18]:
from sklearn.ensemble import RandomForestClassifier

X = data[['f'+str(i) for i in range(400)]].values
Y = data['label'].values

r_val = randint(1,1000)
print('Random state = %3d'%(r_val))
X_train, X_test, Y_train, Y_test = tts(X,Y,test_size=0.3, random_state=r_val)

classifier = RandomForestClassifier(n_estimators=100, max_depth=800, random_state=r_val, warm_start=True, max_features='log2')
classifier.fit(X_train, Y_train)

acc = classifier.score(X_test,Y_test)
print('Accuracy: %.3f%%' % (acc*100))
print('Approximate incorrect samples: %d/%d'%((1-acc)*len(X_test),len(X_test)))

Random state = 228
Accuracy: 98.759%
Approximate incorrect samples: 73/5880
