In [None]:
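'''Trains a simple convnet on the MNIST dataset.
Gets to 99.25% test accuracy after 12 epochs
(there is still a lot of margin for parameter tuning).
16 seconds per epoch on a GRID K520 GPU.

NOTE: in this notebook the fit/evaluate calls at the end of the cell are
commented out, so running the cell only builds and compiles the model.
'''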

from __future__ import print_function
import numpy as np
np.random.seed(1337)  # for reproducibility

from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten
from keras.layers import Convolution2D, MaxPooling2D
from keras.utils import np_utils
from keras import backend as K

# Training hyper-parameters: mini-batch size, number of target classes
# and number of epochs.
batch_size, nb_classes, nb_epoch = 128, 10, 12

# Input image dimensions (rows, columns).
img_rows = img_cols = 28
# Number of filters in each convolution layer.
nb_filters = 32
# Pooling window used by the max-pooling layer.
pool_size = (2, 2)
# Convolution kernel extent.
kernel_size = (3, 3)

# MNIST data, shuffled and already split into train and test sets.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# With 'th' dimension ordering the single channel axis comes first;
# with any other ordering it comes last.
if K.image_dim_ordering() == 'th':
    input_shape = (1, img_rows, img_cols)
else:
    input_shape = (img_rows, img_cols, 1)

# Reshape every sample to input_shape, cast to float32 and divide by 255.
X_train = X_train.reshape((X_train.shape[0],) + input_shape).astype('float32') / 255
X_test = X_test.reshape((X_test.shape[0],) + input_shape).astype('float32') / 255

print('X_train shape:', X_train.shape)
print(X_train.shape[0], 'train samples')
print(X_test.shape[0], 'test samples')

# Turn the class vectors into binary class matrices with nb_classes columns.
Y_train = np_utils.to_categorical(y_train, nb_classes)
Y_test = np_utils.to_categorical(y_test, nb_classes)

# Build the network by appending layers to a Sequential container,
# in the order they should be applied.
model = Sequential()

# First convolution: nb_filters kernels of kernel_size with border_mode
# 'valid'. It is the first layer, so it is the one given input_shape.
model.add(Convolution2D(nb_filters, kernel_size[0], kernel_size[1],
                        border_mode='valid',
                        input_shape=input_shape))
model.add(Activation('relu'))
# Second convolution with the same filter count and kernel size.
model.add(Convolution2D(nb_filters, kernel_size[0], kernel_size[1]))
model.add(Activation('relu'))
# Max pooling over pool_size windows, followed by Dropout(0.25).
model.add(MaxPooling2D(pool_size=pool_size))
model.add(Dropout(0.25))

# Classifier part: flatten, Dense(128) + ReLU, Dropout(0.5), then a Dense
# layer with one unit per class followed by softmax.
model.add(Flatten())
model.add(Dense(128))
model.add(Activation('relu'))
model.add(Dropout(0.5))
model.add(Dense(nb_classes))
model.add(Activation('softmax'))

# Categorical cross-entropy matches the binary class matrices produced by
# to_categorical; accuracy is reported as an extra metric.
model.compile(loss='categorical_crossentropy',
              optimizer='adadelta',
              metrics=['accuracy'])

# from keras.callbacks import TensorBoard

# tb = TensorBoard(
#     log_dir='./logs', histogram_freq=0, write_graph=True, write_images=False)

# model.fit(X_train,
#           Y_train,
#           batch_size=batch_size,
#           nb_epoch=nb_epoch,
#           verbose=1,
#           validation_data=(X_test, Y_test),
#           callbacks=[tb])
# score = model.evaluate(X_test, Y_test, verbose=0)
# print('Test score:', score[0])
# print('Test accuracy:', score[1])

In [None]:
from keras.preprocessing.image import ImageDataGenerator, array_to_img, img_to_array
from keras.preprocessing.image import load_img, list_pictures

# Take the first path that list_pictures returns for the pollen image folder.
# NOTE(review): the [0] index raises IndexError if no pictures are found.
p = list_pictures('/home/ubuntu/ai/md/imagenesdepolen')[0]
# Load it with target_size=(200, 200); presumably this resizes the image to
# 200x200 -- confirm against the Keras load_img documentation.
a = load_img(p, target_size=(200,200))

In [None]:


# for p in list_pictures('/home/ubuntu/ai/md/imagenesdepolen'):
#     i = load_img(p)
#     print(float(i.height) / i.width)
    
    
    
    
# sorted(list_pictures('/home/ubuntu/ai/md/imagenesdepolen'),
#        key=lambda p: load_img(p).height/load_img(p).width)    

# '/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_17.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_22.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_29.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_31.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_35.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/arecaceae_04.jpg',
#     ...
# '/home/ubuntu/ai/md/imagenesdepolen/tridax_26.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/tridax_27.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/tridax_28.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/tridax_33.jpg',
# '/home/ubuntu/ai/md/imagenesdepolen/syagrus_32.jpg'

# Last expression of the cell: the loaded image becomes the cell's output.
load_img('/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_17.jpg')
# load_img('/home/ubuntu/ai/md/imagenesdepolen/syagrus_32.jpg')

In [None]:
# Poner esto en titanpad/DeepLearning
# Gracias Jesús.
# La verdad que después de leer un poco sobre CNNs, teniendo en cuenta que tenemos pocas imágenes, para entrenar la red y para evitar sobreajuste parece que es conveniente generar nuevas imágenes aplicando ruido a las originales con una técnica que parece llamarse "data augmentation".
# En este sentido estoy por pensar que el hecho de que las imágenes sean de distinto tamaño puede hasta haber sido una afortunada casualidad que nos haga reflexionar sobre el asunto.
# O dicho de otro modo, las que sean cuadradas las podemos coger tal cual y aplicar el redimensionado al tamaño que decidamos para el shape del input, y las que no sean cuadradas las podemos "trocear" en cuadrados.
# Por cierto, en relación a lo que comentabas sobre los posibles frameworks, yo la verdad es que he empezado a jugar con Keras (y TensorFlow como backend). Lo de TensorFlow en lugar de Theano era porque me llamaba la atención TensorBoard, pero en vano, porque la máquina en la que hago las pruebas es tan pequeña que parece que se queda sin memoria.

from keras.preprocessing.image import ImageDataGenerator

# Image generator configured for data augmentation. Parameter meanings are
# those of the Keras ImageDataGenerator API -- check the docs for the
# installed Keras version.
datagen = ImageDataGenerator(
    # Value scaling.
    rescale=1. / 255,
    # Geometric transformations.
    rotation_range=40,
    shear_range=0.2,
    zoom_range=0.2,
    width_shift_range=0.2,
    height_shift_range=0.2,
    horizontal_flip=True,
    # How points outside the original image boundaries are filled.
    fill_mode='nearest',
)

In [106]:
from keras.preprocessing.image import ImageDataGenerator
from keras.preprocessing.image import load_img, list_pictures
from keras.preprocessing.image import array_to_img, img_to_array

# p = list_pictures('/home/ubuntu/ai/md/imagenesdepolen')[0]

# a = load_img('/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_16.jpg')

# Load one sample pollen image into `a`; alternative sample files are kept
# commented out around this line.
a = load_img('/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_17.jpg')
# a = load_img('/home/ubuntu/ai/md/imagenesdepolen/syagrus_32.jpg')

In [64]:
# Generador de carpetas de imágenes con train, test, validation 60-20-20
# a partir de las imágenes originales

%matplotlib inline

from keras.preprocessing.image import ImageDataGenerator
from keras.preprocessing.image import load_img, list_pictures
from keras.preprocessing.image import array_to_img, img_to_array
from itertools import groupby
from random import shuffle
import pprint

# Pretty-printer with indent=0; a commented-out line further down uses it
# to print the result of fold().
pp = pprint.PrettyPrinter(indent=0)

# from matplotlib.pyplot import plot

# pictures = list_pictures('/home/ubuntu/ai/md/imagenesdepolen')

def cut_up_picture(p):
    """
    Cut two square crops out of an image.

    The side of the square is the smaller of the image's two dimensions.
    The first crop is anchored at the (0, 0) corner and the second at the
    opposite (width, height) corner, so a square input yields two crops
    of the same full-image region.

    p: image object exposing ``size``, ``width``, ``height`` and
       ``crop(box)`` (e.g. what ``load_img`` returns).
    Returns the tuple ``(first_crop, second_crop)``.
    """
    side = min(p.size)
    right, bottom = p.width, p.height
    first_box = (0, 0, side, side)
    second_box = (right - side, bottom - side, right, bottom)
    return p.crop(first_box), p.crop(second_box)
    
def fold(pictures):
    """
    Split picture paths into train/test/validation sets, class by class.

    The class of a path is the part of its file name that precedes the
    first underscore (``.../anadenanthera_17.jpg`` -> ``anadenanthera``).
    The paths of each class are shuffled with ``random.shuffle`` and then
    cut at 60% and 80% of the class size (rounded), giving roughly a
    60/20/20 split.

    pictures: iterable of path strings using "/" as separator. They may
        come in any order; they are sorted by class before grouping.
    Returns a dict with the keys 'train', 'test' and 'validation', each
        mapping class name -> list of paths.
    """
    def class_of(path):
        # File name without directories, up to the first underscore.
        return path.split("/")[-1].split("_")[0]

    # groupby only merges *adjacent* items with equal keys. Without the
    # sort, a class appearing in several separate runs would produce several
    # groups with the same key, and each would overwrite the previous one
    # in the result, silently dropping pictures.
    groups = groupby(sorted(pictures, key=class_of), class_of)
    result = {'train': {}, 'test': {}, 'validation': {}}
    for k, g in groups:
        g = list(g)
        shuffle(g)
        # Cut points at 60% and 80% of the class size.
        a = int(round(len(g) * 0.6))
        b = int(round(len(g) * 0.8))
        result['train'][k] = g[:a]
        result['test'][k] = g[a:b]
        result['validation'][k] = g[b:]
    return result

    # a = load_img('/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_16.jpg')

    # a = load_img('/home/ubuntu/ai/md/imagenesdepolen/anadenanthera_17.jpg')
    # a = load_img('/home/ubuntu/ai/md/imagenesdepolen/syagrus_32.jpg')


# n, g = groups.next()
# g = list(g)

# pp.pprint( fold(pictures))

(12.0, 16.0, 20)