In [2]:
from keras.datasets import cifar10
# Load CIFAR-10 as (images, labels) pairs for the training and test splits.
# The call may download the dataset archive (see the download message in this
# cell's output).
(X_train, y_train), (X_test, y_test) = cifar10.load_data()

Using TensorFlow backend.


Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz


In [0]:
# The loaded labels are 2-D column vectors (y_train.shape is (50000, 1)).
# Keras tolerates that layout, but flat 1-D label vectors are simpler to work
# with, so collapse both label arrays.
y_train, y_test = y_train.ravel(), y_test.ravel()

In [0]:
from sklearn.model_selection import train_test_split

# Hold out 30% of the training data as a validation set. The split is
# stratified on the labels and uses a fixed random_state so it is repeatable.
# NOTE: this rebinds X_train / y_train, so re-running the cell splits the
# already-reduced training set again.
X_train, X_valid, y_train, y_valid = train_test_split(
    X_train,
    y_train,
    test_size=0.3,
    random_state=42,
    stratify=y_train,
)

In [0]:
import numpy as np
# Convert the images to grayscale by averaging over the channel axis (axis 3),
# keeping that axis so each image stays rank-3 with a single channel.
#
# A mean is used instead of summing X/3 so the cell is safe to re-run: the
# mean over an already single-channel axis returns the same values, whereas
# summing X/3 would divide the pixels by 3 again on every re-execution.
# np.mean accumulates integer input in float64, so the result is floating point.
X_train = np.mean(X_train, axis=3, keepdims=True)
X_valid = np.mean(X_valid, axis=3, keepdims=True)
X_test = np.mean(X_test, axis=3, keepdims=True)

In [0]:
# Center and scale the pixel values: subtract 128, then divide by 128.
# Assuming 8-bit intensities in [0, 255], this maps them to roughly [-1, 1)
# (not [0, 1]).
# NOTE: each statement rebinds its input, so re-running this cell shifts and
# scales the data a second time.
X_train = (X_train - 128) / 128
X_valid = (X_valid - 128) / 128
X_test = (X_test - 128) / 128



In [0]:
import tensorflow as tf

# Number of full passes over the training set made by the training loop.
EPOCHS = 40
# Number of examples per mini-batch; used as the slice size for both training
# and evaluation.
BATCH_SIZE = 128

In [0]:
### Define your architecture here.
from tensorflow.contrib.layers import flatten

def LeNet(x):
    """Build a LeNet-style convolutional classifier and return its logits.

    Three VALID-padded convolution + ReLU stages are stacked, with 2x2 max
    pooling after the first two. The flattened output of the second
    convolution (taken before pooling) is concatenated with the flattened
    output of the third, passed through dropout, and fed to three fully
    connected layers.

    Args:
        x: Batch of input images. The first kernel expects a single input
            channel, and the shape comments below assume 32x32 inputs.

    Returns:
        Tensor of unnormalized class scores with 10 columns.

    Note:
        The dropout layer reads `keep_prob` from the enclosing notebook scope,
        so that name must be defined before this function is called.
    """
    # Every weight tensor is drawn from a truncated normal with these
    # parameters; every bias starts at zero.
    init_mean = 0
    init_stddev = 0.1
    unit_strides = [1, 1, 1, 1]
    pool_2x2 = [1, 2, 2, 1]

    def new_layer_params(weight_shape):
        # Weights first, then a zero bias sized to the layer's output width.
        weights = tf.Variable(tf.truncated_normal(shape=weight_shape, mean=init_mean, stddev=init_stddev))
        biases = tf.Variable(tf.zeros(weight_shape[-1]))
        return weights, biases

    def conv_relu(inputs, kernel_shape):
        # Stride-1 VALID convolution plus bias, followed by ReLU.
        kernel, bias = new_layer_params(kernel_shape)
        pre_activation = tf.nn.conv2d(inputs, kernel, strides=unit_strides, padding='VALID') + bias
        return tf.nn.relu(pre_activation)

    def halve(inputs):
        # 2x2 max pooling with stride 2: halves the height and width.
        return tf.nn.max_pool(inputs, ksize=pool_2x2, strides=pool_2x2, padding='VALID')

    def dense(inputs, n_in, n_out):
        # Affine layer without activation.
        weights, bias = new_layer_params((n_in, n_out))
        return tf.matmul(inputs, weights) + bias

    # Conv 1: 32x32x1 -> 28x28x6, pooled to 14x14x6.
    stage1 = halve(conv_relu(x, (5, 5, 1, 6)))

    # Conv 2: 14x14x6 -> 10x10x16. The un-pooled activations feed the
    # classifier directly (10 * 10 * 16 = 1600 features).
    stage2 = conv_relu(stage1, (5, 5, 6, 16))
    branch_mid = flatten(stage2)
    stage2_pooled = halve(stage2)  # 5x5x16

    # Conv 3: 5x5x16 -> 3x3x32 (3 * 3 * 32 = 288 features).
    stage3 = conv_relu(stage2_pooled, (3, 3, 16, 32))
    branch_deep = flatten(stage3)

    # Join both branches (1600 + 288 = 1888 features) and apply dropout.
    features = tf.concat([branch_mid, branch_deep], 1)
    features = tf.nn.dropout(features, keep_prob)

    # Classifier head: 1888 -> 1024 -> 512 -> 10, ReLU on the hidden layers.
    hidden1 = tf.nn.relu(dense(features, 1888, 1024))
    hidden2 = tf.nn.relu(dense(hidden1, 1024, 512))
    return dense(hidden2, 512, 10)

In [0]:
# Graph inputs, supplied at run time through feed_dict.

# Batch of single-channel 32x32 images.
x = tf.placeholder(tf.float32, (None, 32, 32, 1))
# Integer class labels, one per image. The shape has to be the 1-tuple
# (None,): a bare (None) is just None, which leaves the placeholder's shape
# unspecified and would let unflattened (N, 1) labels through unchecked.
y = tf.placeholder(tf.int32, (None,))
# Dropout keep probability: fed as 0.5 while training and 1 when evaluating.
keep_prob = tf.placeholder(tf.float32)
# Labels expanded to one-hot rows over the 10 classes.
one_hot_y = tf.one_hot(y, 10)



In [0]:
# Learning rate passed to the Adam optimizer below.
rate = 0.001

# Build the network on the image placeholder; the result is the class logits.
logits = LeNet(x)
# Softmax cross-entropy of the logits against the one-hot labels, then its
# mean, which is the scalar loss being minimized.
cross_entropy = tf.nn.softmax_cross_entropy_with_logits(labels=one_hot_y, logits=logits)
loss_operation = tf.reduce_mean(cross_entropy)
optimizer = tf.train.AdamOptimizer(learning_rate = rate)
# The training loop runs this op once per mini-batch.
training_operation = optimizer.minimize(loss_operation)

In [0]:
# A prediction counts as correct when the index of the largest logit equals
# the index of the hot entry in the one-hot label.
correct_prediction = tf.equal(tf.argmax(logits, 1), tf.argmax(one_hot_y, 1))
# Fraction of correct predictions in the fed batch.
accuracy_operation = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
# Used by the training loop to write model checkpoints.
saver = tf.train.Saver()

def evaluate(X_data, y_data):
    """Return the model's accuracy over a dataset, computed in mini-batches.

    The data is processed in slices of BATCH_SIZE with dropout disabled
    (keep_prob fed as 1). Each batch's accuracy is weighted by the number of
    examples in it, so a shorter final batch is accounted for correctly.

    Args:
        X_data: Images; must support len() and slicing.
        y_data: Labels aligned with X_data.

    Returns:
        Sum of (batch accuracy * batch length) divided by len(X_data).

    Note:
        Runs in the current default TensorFlow session, so it must be called
        while a session is active.
    """
    session = tf.get_default_session()
    sample_count = len(X_data)
    weighted_correct = 0
    for start in range(0, sample_count, BATCH_SIZE):
        stop = start + BATCH_SIZE
        images = X_data[start:stop]
        labels = y_data[start:stop]
        feed = {x: images, y: labels, keep_prob: 1}
        batch_accuracy = session.run(accuracy_operation, feed_dict=feed)
        weighted_correct += batch_accuracy * len(images)
    return weighted_correct / sample_count

In [28]:
from sklearn.utils import shuffle

# Train for EPOCHS passes over the training set. After each pass the model is
# evaluated on the validation split, and a checkpoint is written whenever the
# validation accuracy matches or beats the best value seen so far.
with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    # To resume from an earlier run, restore a checkpoint at this point, e.g.
    # saver.restore(sess, tf.train.latest_checkpoint('.'))
    num_examples = len(X_train)
    accuracy = []  # validation accuracy after each epoch, in order
    # Start below any reachable accuracy so the first epoch is checkpointed
    # too; otherwise a single-epoch run, or a run whose best epoch is the
    # first one, would finish without ever saving a model.
    best_accuracy = float('-inf')
    print("Training...")
    print()
    for i in range(EPOCHS):
        # Reshuffle every epoch so the mini-batches differ between passes.
        X_train, y_train = shuffle(X_train, y_train)
        for offset in range(0, num_examples, BATCH_SIZE):
            end = offset + BATCH_SIZE
            batch_x, batch_y = X_train[offset:end], y_train[offset:end]
            # Dropout is active during training (keep half of the features).
            sess.run(training_operation, feed_dict={x: batch_x, y: batch_y, keep_prob: 0.5})

        validation_accuracy = evaluate(X_valid, y_valid)
        print("EPOCH {} ...".format(i+1))
        print("Validation Accuracy = {:.3f}".format(validation_accuracy))
        print()
        accuracy.append(validation_accuracy)
        if validation_accuracy >= best_accuracy:
            best_accuracy = validation_accuracy
            # NOTE(review): '~' is presumably not expanded by the Saver, which
            # would make this path relative to the working directory - confirm
            # before changing it, since restore code must use the same path.
            saver.save(sess, '~/CIFAR-10 Lenet/model')
            print("Model saved")
        

Training...

EPOCH 1 ...
Validation Accuracy = 0.454

EPOCH 2 ...
Validation Accuracy = 0.512

Model saved
EPOCH 3 ...
Validation Accuracy = 0.520

Model saved
EPOCH 4 ...
Validation Accuracy = 0.562

Model saved
EPOCH 5 ...
Validation Accuracy = 0.594

Model saved
EPOCH 6 ...
Validation Accuracy = 0.596

Model saved
EPOCH 7 ...
Validation Accuracy = 0.614

Model saved
EPOCH 8 ...
Validation Accuracy = 0.617

Model saved
EPOCH 9 ...
Validation Accuracy = 0.630

Model saved
EPOCH 10 ...
Validation Accuracy = 0.620

EPOCH 11 ...
Validation Accuracy = 0.632

Model saved
EPOCH 12 ...
Validation Accuracy = 0.628

EPOCH 13 ...
Validation Accuracy = 0.630

EPOCH 14 ...
Validation Accuracy = 0.627

EPOCH 15 ...
Validation Accuracy = 0.627

EPOCH 16 ...
Validation Accuracy = 0.635

Model saved
EPOCH 17 ...
Validation Accuracy = 0.621

EPOCH 18 ...
Validation Accuracy = 0.633

EPOCH 19 ...
Validation Accuracy = 0.629

EPOCH 20 ...
Validation Accuracy = 0.630

EPOCH 21 ...
Validation Accuracy = 0