SanDeepLearn

MNIST Multilayer Perceptron

train_x, train_y, dev_x, dev_y, test_x, test_y = get_data(dataset='mnist')

x = T.fmatrix()
y = T.imatrix()
fc1 = FullyConnectedLayer(
    input_dim=train_x.shape[1],
    output_dim=500,
    activation='tanh'
)
fc2 = FullyConnectedLayer(
    input_dim=500,
    output_dim=500,
    activation='tanh'
)
fc3 = FullyConnectedLayer(
    input_dim=500,
    output_dim=10,
    activation='softmax'
)

params = fc1.params + fc2.params + fc3.params
act1 = fc1.fprop(x)
act2 = fc2.fprop(act1)
act3 = fc3.fprop(act2)
loss = T.nnet.categorical_crossentropy(
    act3,
    y
).mean()

print 'Compiling optimization method ...'
updates = Optimizer().sgd(
    loss,
    params,
    lr=0.01
)

print 'Compiling train function ...'
f_train = theano.function(
    inputs=[x, y],
    outputs=loss,
    updates=updates
)

print 'Compiling evaluation function ...'
f_eval = theano.function(
    inputs=[x],
    outputs=act3
)

print 'Training network ...'
for epoch in xrange(10):
    costs = []
    for batch in xrange(0, train_x.shape[0], 24):
        cost = f_train(
            train_x[batch:batch + 24],
            train_y[batch:batch + 24]
        )
        costs.append(cost)
    print 'Epoch %d Training Loss : %.3f ' % (epoch, np.mean(costs))

dev_predictions = f_eval(dev_x)
test_predictions = f_eval(test_x)
print 'Accuracy on dev : %.3f%% ' % (
    100. * (np.argmax(dev_predictions, axis=1) == dev_y).mean()
)
print 'Accuracy on test : %.3f%% ' % (
    100. * (np.argmax(test_predictions, axis=1) == test_y).mean()
)

MNIST Le-Net 5

train_x, train_y, dev_x, dev_y, test_x, test_y = get_data(dataset='mnist')

train_x = train_x.reshape(
    train_x.shape[0],
    1,
    int(np.sqrt(train_x.shape[1])),
    int(np.sqrt(train_x.shape[1]))
)

dev_x = dev_x.reshape(
    dev_x.shape[0],
    1,
    int(np.sqrt(dev_x.shape[1])),
    int(np.sqrt(dev_x.shape[1]))
)
test_x = test_x.reshape(
    test_x.shape[0],
    1,
    int(np.sqrt(test_x.shape[1])),
    int(np.sqrt(test_x.shape[1]))
)

x = T.tensor4()
y = T.imatrix()

convolution_layer0 = Convolution2DLayer(
    input_height=train_x.shape[2],
    input_width=train_x.shape[3],
    filter_width=5,
    filter_height=5,
    num_filters=20,
    num_feature_maps=1,
    flatten=False,
    wide=False
)

convolution_layer1 = Convolution2DLayer(
    input_height=convolution_layer0.output_height_shape,
    input_width=convolution_layer0.output_width_shape,
    filter_width=5,
    filter_height=5,
    num_filters=50,
    num_feature_maps=20,
    flatten=True,
    wide=False
)

fc1 = FullyConnectedLayer(800, 500, activation='tanh')
fc2 = FullyConnectedLayer(500, 10, activation='softmax')

params = convolution_layer0.params + convolution_layer1.params + \
    fc1.params + fc2.params
act1 = convolution_layer0.fprop(x)
act2 = convolution_layer1.fprop(act1)
act3 = fc1.fprop(act2)
act4 = fc2.fprop(act3)
loss = T.nnet.categorical_crossentropy(
    act4,
    y
).mean()

print 'Compiling optimization method ...'
updates = Optimizer().sgd(
    loss,
    params,
    lr=0.01
)

print 'Compiling train function ...'
f_train = theano.function(
    inputs=[x, y],
    outputs=loss,
    updates=updates
)

print 'Compiling evaluation function ...'
f_eval = theano.function(
    inputs=[x],
    outputs=act4
)

print 'Training network ...'
for epoch in xrange(10):
    costs = []
    for batch in xrange(0, train_x.shape[0], 24):
        cost = f_train(
            train_x[batch:batch + 24],
            train_y[batch:batch + 24]
        )
        costs.append(cost)
    print 'Epoch %d Training Loss : %.3f ' % (epoch, np.mean(costs))

dev_predictions = f_eval(dev_x)
test_predictions = f_eval(test_x)
print 'Accuracy on dev : %.3f%% ' % (
    100. * (np.argmax(dev_predictions, axis=1) == dev_y).mean()
)
print 'Accuracy on test : %.3f%% ' % (
    100. * (np.argmax(test_predictions, axis=1) == test_y).mean()
)

Transmembrane helix prediction using Recurrent Neural Networks

x = T.ivector()
y = T.ivector()

emb = EmbeddingLayer(20, 50, name='embedding')
if network == 'rnn':
    rnn = RNN(50, 50, name='rnn')
elif network == 'lstm':
    rnn = LSTM(50, 50, name='lstm')
fc1 = FullyConnectedLayer(50, 1, name='fc')

params = emb.params + rnn.params + \
    fc1.params
embs = emb.fprop(x)
act1 = rnn.fprop(embs)
act2 = fc1.fprop(act1)
loss = ((act2.transpose() - y) ** 2).mean()

print 'Compiling optimization method ...'
updates = Optimizer().sgd(
    loss,
    params,
    lr=0.01
)

print 'Compiling train function ...'
f_train = theano.function(
    inputs=[x, y],
    outputs=loss,
    updates=updates
)

print 'Compiling evaluation function ...'
f_eval = theano.function(
    inputs=[x],
    outputs=act2
)

print 'Training network ...'
for epoch in xrange(10):
    costs = []
    for data_point, labels in zip(train_x, train_y):
        cost = f_train(
            data_point,
            labels
        )
    costs.append(cost)

    print 'Epoch %d Training Loss : %f ' % (epoch, np.mean(costs))

accs = []
for data_point, labels in zip(test_x, test_y):
    preds = f_eval(data_point).squeeze()
    preds = [1 if pred > 0.5 else 0 for pred in preds]
    acc = sum([True if a == b else False for a, b in zip(preds, labels)]) \
        / float(len(preds))
    accs.append(acc)
print 'Testing Accuracy : %f%% ' % (np.mean(accs) * 100.)

Name		Name	Last commit message	Last commit date
Latest commit History 54 Commits
data		data
experiments		experiments
README.md		README.md
attention.py		attention.py
convolution.py		convolution.py
crf.py		crf.py
layer.py		layer.py
optimizers.py		optimizers.py
recurrent.py		recurrent.py
residual.py		residual.py
sequential.py		sequential.py
unit_test.py		unit_test.py
utils.py		utils.py

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

data

data

experiments

experiments

README.md

README.md

attention.py

attention.py

convolution.py

convolution.py

crf.py

crf.py

layer.py

layer.py

optimizers.py

optimizers.py

recurrent.py

recurrent.py

residual.py

residual.py

sequential.py

sequential.py

unit_test.py

unit_test.py

utils.py

utils.py

Repository files navigation

SanDeepLearn

MNIST Multilayer Perceptron

MNIST Le-Net 5

Transmembrane helix prediction using Recurrent Neural Networks

About

Releases

Packages

Languages

MaximumEntropy/SanDeepLearn

Folders and files

Latest commit

History

Repository files navigation

SanDeepLearn

MNIST Multilayer Perceptron

MNIST Le-Net 5

Transmembrane helix prediction using Recurrent Neural Networks

About

Resources

Stars

Watchers

Forks

Languages