# -*- coding: utf-8 -*-
"""
Created on Mon Mar 28 12:26:06 2016
@author: shengx
Main script: trains a convolutional network that maps glyphs rendered
from an input font to a target font.
"""
#%%
import numpy as np
import theano
from theano import tensor as T
from Font import *
from utility import *
from NeuralNets import *
basis_size = 50       # each glyph is rendered as a basis_size x basis_size bitmap
training_size = 1000
testing_size = 50

generateLetterSets(training_size, testing_size)
inputFont = Font(basis_size, 'simsun.ttf')
trainInput, testInput = inputFont.getLetterSets()
outputFont = Font(basis_size, 'simsun.ttf')   # the same font is used as the target here
trainOutput, testOutput = outputFont.getLetterSets()
trainInput = np.reshape(trainInput, (basis_size**2, training_size))    # 2500 x 1000
testInput = np.reshape(testInput, (basis_size**2, testing_size))       # 2500 x 50
trainOutput = np.reshape(trainOutput, (basis_size**2, training_size))  # 2500 x 1000
testOutput = np.reshape(testOutput, (basis_size**2, testing_size))     # 2500 x 50

# put one example per row: (examples, pixels)
trainInput = trainInput.transpose()
trainOutput = trainOutput.transpose()
trainOutput = trainOutput.flatten()  # concatenate all target pixels into one vector

# invert pixel values (presumably so glyph strokes become 1 and the background 0)
trainInput = 1 - trainInput
trainOutput = 1 - trainOutput

testInput = testInput.transpose()
testOutput = testOutput.transpose()
testOutput = testOutput.flatten()
testInput = 1 - testInput
testOutput = 1 - testOutput
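
# Resulting array shapes (a quick sanity check, given the sizes above):
#   trainInput:  (1000, 2500)   one flattened 50x50 glyph per row
#   trainOutput: (2500000,)     all training target pixels concatenated
#   testInput:   (50, 2500)
#   testOutput:  (125000,)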
batch_size = 1
def shared_dataset(data_x, data_y):
    """Load the dataset into shared variables.

    We store the dataset in shared variables so that Theano can copy it
    into GPU memory (when the code is run on a GPU). Copying data to the
    GPU is slow, so copying each minibatch on demand (the default
    behaviour when the data is not in a shared variable) would hurt
    performance badly.
    """
    shared_x = theano.shared(np.asarray(data_x, dtype=theano.config.floatX))
    shared_y = theano.shared(np.asarray(data_y, dtype=theano.config.floatX))
    # Data stored on the GPU has to be stored as floats, so the labels are
    # stored as ``floatX`` as well (that is what ``shared_y`` does). During
    # computation we need them as ints (they are used as indices, which
    # makes no sense for floats), so instead of returning ``shared_y``
    # directly we return a symbolic int32 cast of it.
    return shared_x, T.cast(shared_y, 'int32')
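
# Illustrative use (hypothetical shapes): the returned x is a device-side
# shared variable, so reading it back requires get_value(); the int32 cast
# is symbolic, so the underlying storage for y stays floatX.
# sx, sy = shared_dataset(np.zeros((4, 9)), np.zeros(4))
# assert sx.get_value().shape == (4, 9)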
#testInput, testOutput = shared_dataset(testInput, testOutput)
trainInput, trainOutput = shared_dataset(trainInput, trainOutput)
#%% building the neural network
rng1 = np.random.RandomState(1234)
rng2 = np.random.RandomState(2345)
rng3 = np.random.RandomState(1567)
rng4 = np.random.RandomState(1124)
nkerns = [20, 30]     # number of filters in each convolutional layer
learning_rate = 0.2

# allocate symbolic variables for the data
index = T.lscalar()   # index to a [mini]batch
x = T.matrix('x')     # flattened input glyphs, one per row
y = T.ivector('y')    # flattened target pixels
print('... building the model')
layer0_input = x.reshape((batch_size, 1, basis_size, basis_size))
# first convolutional layer
# input image 50x50, filter size 5x5, nkerns[0] filters
# after (valid) filtering, feature maps shrink to (50 - 5 + 1) = 46
# after 2x2 max pooling, they shrink to 46 / 2 = 23
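# In general, a "valid" convolution with an f x f filter followed by
# (p, p) max pooling maps n x n feature maps to ((n - f + 1) // p) square:
# here (50 - 5 + 1) // 2 = 23, and for the next layer (23 - 4 + 1) // 2 = 10.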
layer0 = LeNetConvPoolLayer(
    rng1,
    input=layer0_input,
    image_shape=(batch_size, 1, basis_size, basis_size),  # input image shape
    filter_shape=(nkerns[0], 1, 5, 5),
    poolsize=(2, 2)
)
# second convolutional layer
# input feature maps 23x23, filter size 4x4, nkerns[1] filters
# after filtering, size (23 - 4 + 1) = 20
# after 2x2 max pooling, size 20 / 2 = 10
layer1 = LeNetConvPoolLayer(
    rng2,
    input=layer0.output,
    image_shape=(batch_size, nkerns[0], 23, 23),
    filter_shape=(nkerns[1], nkerns[0], 4, 4),
    poolsize=(2, 2)
)
layer2_input = layer1.output.flatten(2)
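# flatten(2) keeps the first (batch) dimension and collapses the rest,
# yielding a (batch_size, nkerns[1] * 10 * 10) = (1, 3000) matrix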
# construct a fully-connected sigmoidal layer
layer2 = HiddenLayer(
    rng3,
    input=layer2_input,
    n_in=nkerns[1] * 10 * 10,
    n_out=400,
    activation=T.nnet.sigmoid
)
# output layer: one sigmoid unit per pixel of the 50x50 target glyph
layer3 = HiddenLayer(
    rng4,
    input=layer2.output,
    n_in=400,
    n_out=basis_size * basis_size,
    activation=T.nnet.sigmoid
)
# sum-of-squared-errors between the predicted and target pixels
cost = ((layer3.output - y) ** 2).sum()
params = layer3.params + layer2.params + layer1.params + layer0.params
grads = T.grad(cost, params)
updates = [
    (param_i, param_i - learning_rate * grad_i)
    for param_i, grad_i in zip(params, grads)
]
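# The updates implement plain stochastic gradient descent,
#   param <- param - learning_rate * d(cost)/d(param),
# with learning_rate = 0.2 and no momentum or weight decay.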
# test_model = theano.function(
#     inputs=[index],
#     outputs=cost,
#     givens={
#         x: testInput[index * batch_size: (index + 1) * batch_size],
#         y: testOutput[index * batch_size: (index + 1) * batch_size]
#     }
# )
train_model = theano.function(
    inputs=[index],
    outputs=cost,
    updates=updates,
    givens={
        x: trainInput[index: (index + 1)],
        y: trainOutput[index * basis_size * basis_size: (index + 1) * basis_size * basis_size]
    }
)
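# Note on the givens: trainInput holds one flattened glyph per row, so the
# row slice [index : index + 1] selects a single (1, 2500) example, while
# trainOutput was flattened into one long vector, so the matching targets
# are the 2500 pixels at [index * 2500 : (index + 1) * 2500] (batch_size is 1).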
#%% training the model
n_train_batches = 50   # with batch_size = 1, only the first 50 of the
                       # 1000 training examples are visited each epoch
n_epochs = 10
for epoch in range(1, n_epochs + 1):
    for minibatch_index in range(n_train_batches):
        minibatch_avg_cost = train_model(minibatch_index)
        print('epoch %i, minibatch %i/%i, cost %f'
              % (epoch, minibatch_index + 1, n_train_batches, minibatch_avg_cost))
        # test_losses = [test_model(i) for i in range(n_test_batches)]
        # test_score = np.mean(test_losses)
#%%
predict_model = theano.function(
    inputs=[x],
    outputs=layer3.output
)
# testInput was kept as a plain NumPy array (shared_dataset was not applied
# to it above), so it can be passed to the compiled function directly
predicted_values = predict_model(testInput[22:23])  # predict test glyph no. 22
import matplotlib.pyplot as plt

# layer3 uses sigmoid activations, so the prediction already lies in [0, 1]
# and needs no further rescaling before plotting
output_img = predicted_values.reshape(basis_size, basis_size)
plt.imshow(output_img)
plt.show()
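
# Optional (illustrative sketch): plot the ground-truth glyph next to the
# prediction for the same test example; the target pixels for glyph 22 sit
# at the corresponding slice of the flattened testOutput vector.
# target_img = testOutput[22 * basis_size**2: 23 * basis_size**2].reshape(basis_size, basis_size)
# fig, axes = plt.subplots(1, 2)
# axes[0].imshow(target_img)
# axes[1].imshow(output_img)
# plt.show()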