In [1]:
import os

# Choose the Keras backend ('tensorflow' or 'theano'). This is set here,
# ahead of the keras imports in the next cell.
os.environ.update({'KERAS_BACKEND': 'tensorflow'})

In [2]:
from keras.models import Input, Model
from keras.layers import Conv1D, Dense, Activation, MaxPool1D, Dropout
from keras.optimizers import Adam
from keras.regularizers import l1_l2
from keras.utils.np_utils import to_categorical
import numpy as np
from sklearn.datasets.samples_generator import make_blobs
import matplotlib.pyplot as plt

Using TensorFlow backend.


In [3]:
def cnn_1d(n_rows, n_cols, n_filters, n_classes, n_pool=1, learning_rate=0.005,
           l1=0, l2=1e-4):
    """Build and compile a small 1-D convolutional softmax classifier.

    The network is: input -> Conv1D (kernel size 1, ReLU) -> MaxPool1D ->
    Dense (softmax). The Dense layer is applied to the pooled tensor without
    flattening, so the prediction keeps the pooled step axis (with
    ``n_rows=1`` and ``n_pool=1`` the output shape is
    ``(batch, 1, n_classes)``).

    Args:
        n_rows: Length of the first axis of each input sample.
        n_cols: Length of the second axis of each input sample.
        n_filters: Number of convolution filters.
        n_classes: Number of units in the softmax output layer.
        n_pool: Pool size passed to ``MaxPool1D``.
        learning_rate: Learning rate for the Adam optimizer.
        l1: L1 penalty coefficient applied to the kernels of the
            convolution and output layers.
        l2: L2 penalty coefficient applied to the kernels of the
            convolution and output layers.

    Returns:
        A compiled Keras ``Model`` that uses categorical cross-entropy loss
        and reports accuracy.
    """
    # the input layer
    data_input = Input(shape=(n_rows, n_cols))

    # the filters: kernel size 1 and stride 1, so each step along the first
    # axis is transformed independently of its neighbours
    convolution = Conv1D(
        n_filters,
        1,
        activation='relu',
        kernel_regularizer=l1_l2(l1=l1, l2=l2),
        strides=1,
        padding='same',
        name='conv1'
    )(data_input)

    # the cell grouping part
    pooled = MaxPool1D(pool_size=n_pool)(convolution)

    # network prediction output (each layer gets its own regularizer instance)
    output = Dense(
        n_classes,
        activation='softmax',
        kernel_regularizer=l1_l2(l1=l1, l2=l2),
        name='output'
    )(pooled)

    model = Model(inputs=data_input, outputs=output)

    model.compile(
        optimizer=Adam(lr=learning_rate),
        loss='categorical_crossentropy',
        metrics=['accuracy']
    )

    return model

In [4]:
n_features = 2
points_per_feature = 10000
centers = [(2, 2), (4, 4)]

# Draw tight Gaussian blobs around each entry of `centers`; the fixed
# random_state keeps the sample reproducible.
# NOTE(review): the total sample count is points_per_feature * n_features,
# which equals "points per blob * number of blobs" only because
# len(centers) == n_features here -- confirm intent before changing either.
data, labels = make_blobs(
    centers=centers,
    n_features=n_features,
    n_samples=n_features * points_per_feature,
    cluster_std=0.3,
    random_state=5,
)

# Quick look at the clusters: column 0 on the x axis, column 1 on the y axis.
plt.figure(figsize=(2, 2))
plt.scatter(*data.T, s=1, alpha=0.3)

<matplotlib.collections.PathCollection at 0x7f7dfc3fdb70>

In [5]:
# Peek at the first three samples.
data[:3]

array([[ 2.17708414,  1.37538287],
       [ 4.05104876,  3.81916713],
       [ 3.76084191,  4.36784065]])

In [6]:
# (number of samples, number of features)
np.shape(data)

(20000, 2)

In [7]:
# The network input must be ordered as (batch size, rows, cols).
# First append a trailing axis, then move it in front of the feature axis,
# printing the shape after every step.
# NOTE: this cell reassigns `data`, so running it a second time adds yet
# another axis; re-run the data-generation cell first if you need to repeat it.
print(data.shape)
data = data[:, :, np.newaxis]
print(data.shape)
data = np.moveaxis(data, 2, 1)
print(data.shape)

(20000, 2)
(20000, 2, 1)
(20000, 1, 2)


In [8]:
# Integer class label for each sample, as returned by make_blobs.
labels

array([0, 1, 1, ..., 1, 1, 1])

In [9]:
# One label per sample.
np.shape(labels)

(20000,)

In [10]:
# One-hot encode the integer labels: one column per class, with a 1 in the
# column of the sample's class.
binary_labels = to_categorical(labels)
binary_labels

array([[ 1.,  0.],
       [ 0.,  1.],
       [ 0.,  1.],
       ..., 
       [ 0.,  1.],
       [ 0.,  1.],
       [ 0.,  1.]])

In [11]:
# Cast the one-hot matrix from floats to 32-bit integers.
binary_labels = binary_labels.astype(np.int32)
binary_labels

array([[1, 0],
       [0, 1],
       [0, 1],
       ..., 
       [0, 1],
       [0, 1],
       [0, 1]], dtype=int32)

In [12]:
# Each sample is a single row with two columns; five filters, two classes.
model = cnn_1d(
    n_rows=1,
    n_cols=2,
    n_filters=5,
    n_classes=2,
    n_pool=1,
    learning_rate=0.1,
)

In [13]:
# Print the layer-by-layer output shapes and parameter counts.
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 1, 2)              0         
_________________________________________________________________
conv1 (Conv1D)               (None, 1, 5)              15        
_________________________________________________________________
max_pooling1d_1 (MaxPooling1 (None, 1, 5)              0         
_________________________________________________________________
output (Dense)               (None, 1, 2)              12        
Total params: 27
Trainable params: 27
Non-trainable params: 0
_________________________________________________________________


In [15]:
# The labels get an extra middle axis so they match the model's
# (batch, 1, classes) output. batch_size is set to the full dataset size,
# and 30% of the samples are held out for validation.
model.fit(
    x=data,
    y=binary_labels[:, np.newaxis, :],
    epochs=100,
    batch_size=n_features * points_per_feature,
    validation_split=0.3,
    verbose=2,
)

Train on 14000 samples, validate on 6000 samples
Epoch 1/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 2/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 3/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 4/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 5/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 6/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 7/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 8/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 9/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 10/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 11/100
 - 0s - loss: 0.0018 - acc: 1.0000 - val_loss: 0.0018 - val_acc: 1.0000
Epoch 12/100
 - 0s - loss

<keras.callbacks.History at 0x7f7df85938d0>

In [16]:
# Hand-picked probe points: the two blob centers plus a few points that lie
# between or beside them.
test_data = np.array([
    [2, 2],
    [4, 4],
    [3, 3],
    [2.0, 4.0],
    [2.5, 2.5],
])

# Insert the single-row axis expected by the model before predicting.
model.predict(test_data[:, np.newaxis, :])

array([[[  9.99895453e-01,   1.04542880e-04]],

       [[  2.00479280e-05,   9.99979973e-01]],

       [[  4.65345770e-01,   5.34654200e-01]],

       [[  4.44155514e-01,   5.55844486e-01]],

       [[  9.94515955e-01,   5.48397936e-03]]], dtype=float32)