# Deep Learning sin GPU

Utilizamos Keras para definir una red neuronal convolucional que aprende a clasificar los dígitos manuscritos de la base de datos MNIST.

In [1]:
from keras import layers 
from keras import models
from keras.datasets import mnist
from keras.utils import to_categorical

Using TensorFlow backend.


In [0]:
# Network architecture, declared as one ordered list of layers.
model = models.Sequential([
    # Convolutional layer: 32 filters, 3x3 kernels, ReLU activation
    layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)),
    layers.MaxPooling2D((2, 2)),

    # 64 filters, 3x3 kernels
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),

    # 64 filters, 3x3 kernels
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.Flatten(),

    # Fully connected layers. The last one applies softmax so the network
    # outputs the predicted probability distribution over the 10 classes.
    layers.Dense(64, activation='relu'),
    layers.Dense(10, activation='softmax'),
])

In [3]:
# Print the layer-by-layer summary (output shapes and parameter counts)
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_3 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 64)                36928     
__________

In [4]:
# Download MNIST; load_data() returns a (train, test) pair of
# (images, labels) tuples, unpacked here in two steps.
train_split, test_split = mnist.load_data()
train_images, train_labels = train_split
test_images, test_labels = test_split

Downloading data from https://s3.amazonaws.com/img-datasets/mnist.npz


In [5]:
# Image preprocessing.
#
# NOTE: this cell overwrites its own inputs (images are rescaled and labels
# are re-encoded in place), so re-run the data-loading cell before running
# it a second time.

IMAGE_SHAPE = (28, 28, 1)  # same as the input_shape of the first Conv2D layer
NUM_CLASSES = 10           # same as the width of the final softmax layer

# Add an explicit channel axis and divide pixel values by 255. The leading -1
# lets NumPy infer the number of samples instead of hard-coding 60000/10000,
# so the cell also works on a subset of the data.
train_images = train_images.reshape((-1,) + IMAGE_SHAPE)
train_images = train_images.astype('float32') / 255

test_images = test_images.reshape((-1,) + IMAGE_SHAPE)
test_images = test_images.astype('float32') / 255

# Convert the class of each image to a one-hot encoded vector:
# 0 => [1 0 0 ... 0]
# 1 => [0 1 0 ... 0]
# ...
# 9 => [0 0 0 ... 1]
#
# num_classes is passed explicitly: otherwise the vector width is inferred
# from the largest label present, which could differ between the two splits
# and from the model's output layer.
train_labels = to_categorical(train_labels, num_classes=NUM_CLASSES)
test_labels = to_categorical(test_labels, num_classes=NUM_CLASSES)

# Compile the model and train for 5 epochs
model.compile(optimizer='rmsprop',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

model.fit(train_images, train_labels, epochs=5, batch_size=64)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<keras.callbacks.History at 0x7f3ce441d940>

Tiempo total de ejecución sin GPU: 5 minutos, 28 segundos.

In [0]:
# Measure performance on the test set. The model was compiled with a single
# metric, so evaluate() returns the loss followed by the accuracy.
test_metrics = model.evaluate(test_images, test_labels)
test_loss, test_acc = test_metrics
test_acc



0.992

El modelo obtiene una *accuracy* de 0,992 sobre el conjunto de prueba.