In [33]:
from keras.preprocessing.image import ImageDataGenerator, array_to_img, img_to_array, load_img

datagen = ImageDataGenerator(
        rotation_range=40,
        width_shift_range=0.2,
        height_shift_range=0.2,
        shear_range=0.2,
        zoom_range=0.2,
        horizontal_flip=True,
        fill_mode='nearest')

img = load_img('data/train/cats/cat.0.jpg')  # this is a PIL image
x = img_to_array(img)  # this is a Numpy array with shape (3, 150, 150)
x = x.reshape((1,) + x.shape)  # this is a Numpy array with shape (1, 3, 150, 150)

# the .flow() command below generates batches of randomly transformed images
# and saves the results to the `preview/` directory
i = 0

# je potřeba aby složka preview již existovala. Ve stejné složce, jako je tento notebook
for batch in datagen.flow(x, batch_size=1,
                          save_to_dir='preview', save_prefix='cat', save_format='jpeg'):
    i += 1
    if i > 20:
        break  # otherwise the generator would loop indefinitely

## Vysvětlení k numpy arrays

In [20]:
import numpy as np
a=np.arange(1200)
print(a)

[   0    1    2 ..., 1197 1198 1199]


numpy array ma property "shape", která obsahuje informaci o dimenzích tohoto pole, které jsou uloženy pomocí tuplu.

In [23]:
a.shape

(1200,)

tuply lze spojovat pomocí symbolu +

In [24]:
x=(1,)+(3, 20, 20)
print(x)

(1, 3, 20, 20)


In [26]:
c=a.reshape((1,)+a.shape)
print("a is: ",a)
print("c is: ",c)

a is:  [   0    1    2 ..., 1197 1198 1199]
c is:  [[   0    1    2 ..., 1197 1198 1199]]


In [27]:
print('shape of a is: ',a.shape)
print('shape of c is: ',c.shape)

shape of a is:  (1200,)
shape of c is:  (1, 1200)


Pokud chci z jednorozměrného pole vytvořit třírozměrné, musím si pohlídat dimenze. Součin nových dimenzí se musí rovnat součinu původních dimenzí. 1200=3*20*20

In [28]:
b=a.reshape(3,20,20)
print('shape of b is: ',b.shape)

shape of b is:  (3, 20, 20)


In [29]:
print(b)

[[[   0    1    2 ...,   17   18   19]
  [  20   21   22 ...,   37   38   39]
  [  40   41   42 ...,   57   58   59]
  ..., 
  [ 340  341  342 ...,  357  358  359]
  [ 360  361  362 ...,  377  378  379]
  [ 380  381  382 ...,  397  398  399]]

 [[ 400  401  402 ...,  417  418  419]
  [ 420  421  422 ...,  437  438  439]
  [ 440  441  442 ...,  457  458  459]
  ..., 
  [ 740  741  742 ...,  757  758  759]
  [ 760  761  762 ...,  777  778  779]
  [ 780  781  782 ...,  797  798  799]]

 [[ 800  801  802 ...,  817  818  819]
  [ 820  821  822 ...,  837  838  839]
  [ 840  841  842 ...,  857  858  859]
  ..., 
  [1140 1141 1142 ..., 1157 1158 1159]
  [1160 1161 1162 ..., 1177 1178 1179]
  [1180 1181 1182 ..., 1197 1198 1199]]]


In [31]:
d=b.reshape((1,)+b.shape)
print("shepe of d is: ",d.shape)

shepe of d is:  (1, 3, 20, 20)


In [None]:
from keras.preprocessing.image import ImageDataGenerator
from keras.models import Sequential
from keras.layers import Conv2D, MaxPooling2D
from keras.layers import Activation, Dropout, Flatten, Dense
from keras import backend as K


# dimensions of our images.
img_width, img_height = 150, 150

train_data_dir = 'data/train'
validation_data_dir = 'data/validation'
nb_train_samples = 2000
nb_validation_samples = 800
epochs = 50
batch_size = 16

if K.image_data_format() == 'channels_first':
    input_shape = (3, img_width, img_height)
else:
    input_shape = (img_width, img_height, 3)

model = Sequential()
model.add(Conv2D(32, (3, 3), input_shape=input_shape))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Conv2D(32, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Conv2D(64, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Flatten())
model.add(Dense(64))
model.add(Activation('relu'))
model.add(Dropout(0.5))
model.add(Dense(1))
model.add(Activation('sigmoid'))

model.compile(loss='binary_crossentropy',
              optimizer='rmsprop',
              metrics=['accuracy'])

# this is the augmentation configuration we will use for training
train_datagen = ImageDataGenerator(
    rescale=1. / 255,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True)

# this is the augmentation configuration we will use for testing:
# only rescaling
test_datagen = ImageDataGenerator(rescale=1. / 255)

train_generator = train_datagen.flow_from_directory(
    train_data_dir,
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='binary')

validation_generator = test_datagen.flow_from_directory(
    validation_data_dir,
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='binary')

model.fit_generator(
    train_generator,
    steps_per_epoch=nb_train_samples // batch_size,
    epochs=epochs,
    validation_data=validation_generator,
    validation_steps=nb_validation_samples // batch_size)

model.save_weights('first_try.h5')

Found 24198 images belonging to 3 classes.
Found 802 images belonging to 2 classes.
Epoch 1/50