In [1]:
import pandas as pd
import numpy as np

from sklearn.svm import SVC
from sklearn.model_selection import GridSearchCV
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

## Images:
from skimage.transform import resize
from skimage.io import imread

import os
import matplotlib.pyplot as plt

import pickle

In [2]:
datadir = 'images/'
categories = ['ChickenHead', 'ElephantHead']

flat_data_arr = []
target_arr = []

# Read every image of every category, resize it to a common 150x150x3 shape
# and store it as one flat feature vector; the label is the category's
# position in `categories`.
for label, i in enumerate(categories):
    print('loading... category: ', i)
    path = os.path.join(datadir, i)
    # os.listdir returns entries in arbitrary order; sorting keeps the row
    # order (and therefore the seeded train/test split) stable between runs.
    for img in sorted(os.listdir(path)):
        img_array = imread(os.path.join(path, img))
        img_resized = resize(img_array, (150, 150, 3))
        flat_data_arr.append(img_resized.flatten())
        target_arr.append(label)
    print("loaded category ", i, "successfully")

loading... category:  ChickenHead
loaded category  ChickenHead successfully
loading... category:  ElephantHead
loaded category  ElephantHead successfully


In [3]:
# Stack the per-image feature vectors and their labels into arrays.
flat_data = np.array(flat_data_arr)
target = np.array(target_arr)

# One row per image: the flattened pixel values followed by a trailing
# 'Target' column that holds the category index.
df = pd.DataFrame(flat_data).assign(Target=target)

df.head()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,67491,67492,67493,67494,67495,67496,67497,67498,67499,Target
0,0.258824,0.258824,0.219608,0.231373,0.231373,0.192157,0.168627,0.168627,0.129412,0.180392,...,0.321569,0.321569,0.290196,0.301961,0.301961,0.270588,0.290196,0.290196,0.258824,0
1,0.121569,0.227451,0.105882,0.129412,0.227451,0.113725,0.176471,0.254902,0.14902,0.219608,...,0.784314,0.670588,0.513725,0.772549,0.658824,0.501961,0.768627,0.654902,0.498039,0
2,0.415686,0.698039,0.258824,0.384314,0.666667,0.235294,0.34902,0.619608,0.203922,0.321569,...,0.423529,0.615686,0.266667,0.435294,0.627451,0.270588,0.380392,0.572549,0.215686,0
3,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0
4,0.784314,0.729412,0.623529,0.776471,0.721569,0.615686,0.737255,0.682353,0.576471,0.690196,...,0.717647,0.643137,0.517647,0.72549,0.65098,0.52549,0.721569,0.647059,0.521569,0


In [59]:
# Separate the table into the feature matrix (every column but the last)
# and the label vector (the last column, 'Target').
data_matrix = df.values
X, Y = data_matrix[:, :-1], data_matrix[:, -1]

# Hold out 20% of the rows for testing; the seed fixes the shuffle.
x_train, x_test, y_train, y_test = train_test_split(
    X,
    Y,
    test_size=0.2,
    random_state=47,
)

In [5]:
# Cross-validated search over C and gamma for an RBF-kernel SVM.
svc1 = SVC()
param_grid = dict(
    C=[10, 100],
    gamma=[0.0001, 0.001, 0.1, 1, 10],
    kernel=['rbf'],
)

svc = GridSearchCV(estimator=svc1, param_grid=param_grid)
svc.fit(x_train, y_train)

GridSearchCV(estimator=SVC(),
             param_grid={'C': [10, 100], 'gamma': [0.0001, 0.001, 0.1, 1, 10],
                         'kernel': ['rbf']})

In [6]:
# Show the hyper-parameters selected by the grid search, then score the
# fitted search object on both the training and the held-out split.
print(svc.best_params_)
ypred_train = svc.predict(x_train)
ypred_test = svc.predict(x_test)

# accuracy_score's signature is (y_true, y_pred). Accuracy is symmetric, so
# the value is unchanged, but the correct order keeps this safe if the
# metric is ever swapped for an asymmetric one (precision, recall, ...).
print('Train Accuracy: ', accuracy_score(y_train, ypred_train))
print('Test Accuracy: ', accuracy_score(y_test, ypred_test))

{'C': 10, 'gamma': 0.0001, 'kernel': 'rbf'}
Train Accuracy:  1.0
Test Accuracy:  0.9


In [7]:
from sklearn.ensemble import AdaBoostClassifier

# AdaBoost with 9 boosting rounds. The estimator is stochastic, so it is
# seeded (same value as the train/test split) to make the reported accuracy
# reproducible across runs.
ab = AdaBoostClassifier(n_estimators=9, random_state=47)
ab.fit(x_train, y_train)
y_pred3 = ab.predict(x_test)
# accuracy_score expects (y_true, y_pred).
print('Accuracy =', accuracy_score(y_test, y_pred3))

Accuracy = 0.925


In [65]:
from sklearn.neighbors import KNeighborsClassifier

# k-nearest-neighbours classifier with k = 4, scored on the held-out split.
knn = KNeighborsClassifier(n_neighbors=4)
knn.fit(x_train, y_train)
y_pred2 = knn.predict(x_test)
# accuracy_score expects (y_true, y_pred).
print('max accuracy: ', accuracy_score(y_test, y_pred2))

max accuracy:  0.875


  mode, _ = stats.mode(_y[neigh_ind, k], axis=1)


In [23]:
from sklearn.neural_network import MLPClassifier

# Small ReLU network with two hidden layers (5 and 16 units). Weight
# initialisation is random, so the model is seeded (same value as the
# train/test split) to make the reported accuracy reproducible.
r = MLPClassifier(hidden_layer_sizes=(5, 16), activation='relu', random_state=47)
r.fit(x_train, y_train)
yp_test = r.predict(x_test)
# accuracy_score expects (y_true, y_pred).
print('Test Accuracy: ', accuracy_score(y_test, yp_test))

Test Accuracy:  0.95


In [10]:
from sklearn.ensemble import RandomForestClassifier

# Random forest of 10 trees. Bootstrapping and feature sampling are random,
# so the model is seeded (same value as the train/test split) to make the
# reported accuracy reproducible.
rf = RandomForestClassifier(n_estimators=10, random_state=47)
rf.fit(x_train, y_train)
y_pred1 = rf.predict(x_test)
# accuracy_score expects (y_true, y_pred).
print('Accuracy =', accuracy_score(y_test, y_pred1))

Accuracy = 0.975


In [11]:
# Re-encode the labels in place from {0, 1} to {-1, 1}.
# NOTE(review): this mutates y_train / y_test for every later cell. Models
# fitted after this point predict -1 instead of 0, while the single-image
# prediction cells further down compare the prediction against 0.
y_train[:] = np.where(y_train == 0, -1, y_train)
y_test[:] = np.where(y_test == 0, -1, y_test)

In [58]:
from sklearn.ensemble import AdaBoostClassifier

# Refit AdaBoost (9 boosting rounds) on the current y_train / y_test. In
# cell order these were re-encoded to {-1, 1} by the preceding cell.
# The estimator is stochastic, so it is seeded (same value as the train/test
# split) to make the reported accuracy reproducible.
ab = AdaBoostClassifier(n_estimators=9, random_state=47)
ab.fit(x_train, y_train)
y_pred3 = ab.predict(x_test)
# accuracy_score expects (y_true, y_pred).
print('Accuracy =', accuracy_score(y_test, y_pred3))

Accuracy = 0.925


In [24]:
# Persist every fitted model to its own pickle file. Each file is opened in
# a `with` block so the handle is flushed and closed deterministically
# (the bare open() calls used before were never closed).
for model_obj, model_file in [
    (svc, 'SVCModel.p'),
    (rf, 'randomForestModel.p'),
    (knn, 'KNNModel.p'),
    (ab, 'adaBoostModel.p'),
    (r, 'neuralNetworkModel.p'),
]:
    with open(model_file, 'wb') as fh:
        pickle.dump(model_obj, fh)

In [25]:
def _load_pickle(path):
    """Return the object stored in the pickle file at `path`, closing the file afterwards.

    Unpickling can execute arbitrary code, so only use this on files that
    come from a trusted source.
    """
    with open(path, 'rb') as fh:
        return pickle.load(fh)


# Restore the fitted models from disk.
svc = _load_pickle('SVCModel.p')
rf = _load_pickle('randomForestModel.p')
knn = _load_pickle('KNNModel.p')
ab = _load_pickle('adaBoostModel.p')
r = _load_pickle('neuralNetworkModel.p')

In [51]:
# Preprocess one image exactly like the training images: resize to
# 150x150x3, then flatten into a single-row feature matrix.
filename = 'chicken3.jpg'

img_array = imread(filename)
img_resized = resize(img_array, (150, 150, 3))
test_data = img_resized.reshape(1, -1).copy()
print(test_data.shape)

(1, 67500)


In [52]:
# Classify the single test image with the grid-searched SVM; a predicted
# label of 0 is reported as 'Chicken', anything else as 'Elephant'.
p = svc.predict(test_data)
print('Chicken' if p[0] == 0 else 'Elephant')

Chicken


In [53]:
# Classify the single test image with the random forest; a predicted label
# of 0 is reported as 'Chicken', anything else as 'Elephant'.
p = rf.predict(test_data)
print('Chicken' if p[0] == 0 else 'Elephant')

Chicken


In [54]:
# Classify the single test image with the k-NN model; a predicted label of
# 0 is reported as 'Chicken', anything else as 'Elephant'.
p = knn.predict(test_data)
print('Chicken' if p[0] == 0 else 'Elephant')

Elephant


  mode, _ = stats.mode(_y[neigh_ind, k], axis=1)


In [55]:
# Classify the single test image with AdaBoost.
# In cell order `ab` is fitted after the labels were re-encoded from {0, 1}
# to {-1, 1}, so it never predicts 0 and a `p == 0` test always reports
# 'Elephant'. `classes_` holds the sorted training labels, so its first
# entry is the chicken label under either encoding.
p = ab.predict(test_data)
print('Chicken' if p[0] == ab.classes_[0] else 'Elephant')

Elephant


In [56]:
# Classify the single test image with the neural network; a predicted label
# of 0 is reported as 'Chicken', anything else as 'Elephant'.
p = r.predict(test_data)
print('Chicken' if p[0] == 0 else 'Elephant')

Chicken
