# DeepDream

In [1]:
from keras.applications import inception_v3
from keras import backend as K

Using TensorFlow backend.


In [2]:
# Fix the backend learning phase to 0 (inference/test mode); this notebook
# only runs the network forward and differentiates w.r.t. its input.
K.set_learning_phase(0)

# InceptionV3 loaded with ImageNet weights; include_top=False requests the
# network without its classification head.
model = inception_v3.InceptionV3(weights='imagenet',
                                 include_top=False)

In [3]:
# Print the layer table; the layer names listed here are what later cells look up.
model.summary()

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, None, None, 3 0                                            
__________________________________________________________________________________________________
conv2d_1 (Conv2D)               (None, None, None, 3 864         input_1[0][0]                    
__________________________________________________________________________________________________
batch_normalization_1 (BatchNor (None, None, None, 3 96          conv2d_1[0][0]                   
__________________________________________________________________________________________________
activation_1 (Activation)       (None, None, None, 3 0           batch_normalization_1[0][0]      
__________________________________________________________________________________________________
conv2d_2 (

In [4]:
# Maps a layer name to the coefficient that weights that layer's term in the
# loss. Every key must be the name of a layer in `model`, because the loss
# cell looks each one up by name.
layer_contributions = {
    'mixed2': 0.2,
    'mixed3': 3.,
    'activation_94': 2.,
    'conv2d_93': 0.5,
}

In [5]:
# Index every layer of the model by its name so layers can be fetched with a
# plain dictionary lookup.
layer_dict = {layer.name: layer for layer in model.layers}
layer_dict

{'activation_1': <keras.layers.core.Activation at 0x21c87fa25f8>,
 'activation_10': <keras.layers.core.Activation at 0x21c896b7240>,
 'activation_11': <keras.layers.core.Activation at 0x21c8976e240>,
 'activation_12': <keras.layers.core.Activation at 0x21c897b90b8>,
 'activation_13': <keras.layers.core.Activation at 0x21c89892828>,
 'activation_14': <keras.layers.core.Activation at 0x21c8993bc88>,
 'activation_15': <keras.layers.core.Activation at 0x21c899f9f28>,
 'activation_16': <keras.layers.core.Activation at 0x21c89af27b8>,
 'activation_17': <keras.layers.core.Activation at 0x21c89b5e2b0>,
 'activation_18': <keras.layers.core.Activation at 0x21c89c1def0>,
 'activation_19': <keras.layers.core.Activation at 0x21c89d15438>,
 'activation_2': <keras.layers.core.Activation at 0x21c88007940>,
 'activation_20': <keras.layers.core.Activation at 0x21c89d93f28>,
 'activation_21': <keras.layers.core.Activation at 0x21c89ea3f28>,
 'activation_22': <keras.layers.core.Activation at 0x21c89f77278

In [6]:
# Scalar backend variable initialised to 0; the per-layer loss terms are added to it.
loss = K.variable(0.)
loss

<tf.Variable 'Variable:0' shape=() dtype=float32_ref>

In [7]:
# Build the loss: for each selected layer add
#   coeff * sum(activation_cropped ** 2) / number_of_elements(activation).
#
# keras.backend.prod(x, axis=None, keepdims=False) multiplies the values of a
# tensor along the given axis; applied to the (float-cast) shape vector it
# yields the total element count of `activation`.
#
# NOTE: this cell adds onto the existing `loss`, so re-running it without
# first re-running the cell that initialises `loss` accumulates the terms again.
for layer_name, coeff in layer_contributions.items():
    activation = layer_dict[layer_name].output

    scaling = K.prod(K.cast(K.shape(activation), 'float32'))
    # The slice drops two entries from each end of axes 1 and 2 before summing.
    # `loss = loss + ...` builds a new tensor; the previous in-place `loss += ...`
    # on a tf.Variable is deprecated and logged a warning on every iteration.
    loss = loss + coeff * K.sum(K.square(activation[:, 2: -2, 2: -2, :])) / scaling



In [11]:
# `activation` is the layer output left bound by the last iteration of the loss loop.
activation

<tf.Tensor 'activation_94/Relu:0' shape=(?, ?, ?, 192) dtype=float32>

In [9]:
# Static shape of the leftover `activation` tensor.
activation.shape

TensorShape([Dimension(None), Dimension(None), Dimension(None), Dimension(192)])

In [10]:
# Same slice as in the loss term: drop two entries from each end of axes 1 and 2.
activation[:, 2: -2, 2: -2, :]

<tf.Tensor 'strided_slice_4:0' shape=(?, ?, ?, 192) dtype=float32>

In [12]:
# Static shape of the cropped tensor.
activation[:, 2: -2, 2: -2, :].shape

TensorShape([Dimension(None), Dimension(None), Dimension(None), Dimension(192)])

In [25]:
import numpy as np

# Random 4-D array with a concrete shape, used to try the slicing on real numbers.
# NOTE(review): the bare `temp` below dumps the whole array into the output.
temp = np.random.random((3, 100, 100, 192))
temp

array([[[[0.77147638, 0.80351985, 0.99897626, ..., 0.74351736,
          0.4552565 , 0.63064187],
         [0.53415717, 0.28003292, 0.06011286, ..., 0.31460366,
          0.889959  , 0.33317639],
         [0.98395711, 0.42135504, 0.03193452, ..., 0.24829896,
          0.17837492, 0.44345865],
         ...,
         [0.13668955, 0.66528979, 0.73227538, ..., 0.67865716,
          0.86261658, 0.06498642],
         [0.46804779, 0.82533401, 0.10023764, ..., 0.36688403,
          0.11589357, 0.70151632],
         [0.35673142, 0.57745301, 0.98621367, ..., 0.49021446,
          0.44692248, 0.25979811]],

        [[0.66853825, 0.09302805, 0.47300475, ..., 0.16254072,
          0.09493468, 0.63980146],
         [0.77329842, 0.92800512, 0.36690145, ..., 0.01137691,
          0.40871647, 0.14683201],
         [0.30637711, 0.65144921, 0.14753353, ..., 0.00817554,
          0.99324109, 0.22662307],
         ...,
         [0.78962846, 0.34463083, 0.6308551 , ..., 0.97801888,
          0.91225285, 0.4

In [26]:
# Drop one entry from each end of axes 1 and 2.
temp[:, 1: -1, 1: -1, :]

array([[[[7.73298421e-01, 9.28005122e-01, 3.66901454e-01, ...,
          1.13769145e-02, 4.08716475e-01, 1.46832007e-01],
         [3.06377112e-01, 6.51449212e-01, 1.47533530e-01, ...,
          8.17553560e-03, 9.93241087e-01, 2.26623074e-01],
         [3.09273536e-01, 8.44162845e-01, 6.94256233e-01, ...,
          7.12814529e-01, 2.27645203e-01, 6.49342385e-01],
         ...,
         [6.67396716e-01, 3.22895169e-01, 9.57252412e-01, ...,
          2.99156459e-01, 7.68465224e-01, 1.97233601e-01],
         [7.89628460e-01, 3.44630826e-01, 6.30855099e-01, ...,
          9.78018882e-01, 9.12252852e-01, 4.94555555e-01],
         [3.89292111e-01, 4.26725012e-01, 3.76672783e-01, ...,
          2.04676649e-01, 6.40629410e-01, 3.48928895e-01]],

        [[6.13609296e-01, 6.81746123e-01, 9.15957097e-01, ...,
          2.33876554e-01, 9.54561351e-01, 5.76034654e-01],
         [4.72226144e-01, 9.24669233e-01, 5.53288327e-01, ...,
          3.94020661e-01, 4.85108082e-01, 9.53218623e-01],
        

In [28]:
# Dropping two entries per side shrinks axes 1 and 2 from 100 to 96.
temp[:, 2: -2, 2: -2, :].shape

(3, 96, 96, 192)

In [29]:
dream = model.input  # Input tensor of the model; it holds the generated (dream) image.

grads = K.gradients(loss, dream)[0]  # Gradient of the loss with respect to the dream image.

grads /= K.maximum(K.mean(K.abs(grads)), 1e-7) # Normalise by the mean absolute gradient; the 1e-7 floor guards against division by zero.

outputs = [loss, grads]
fetch_loss_and_grads = K.function([dream], outputs)  # Keras function that, given an image, returns the loss value and the gradient values.

In [30]:
def eval_loss_and_grads(x):
    """Evaluate the loss and its gradient for the image array `x`.

    Feeds `[x]` to `fetch_loss_and_grads` and returns its first two outputs
    as a `(loss_value, grad_values)` tuple.
    """
    results = fetch_loss_and_grads([x])
    return results[0], results[1]

In [31]:
def gradient_ascent(x, iterations, step, max_loss=None):
    """Run up to `iterations` steps of gradient ascent on `x`.

    Each step evaluates the loss and gradients via `eval_loss_and_grads`,
    prints the loss, and adds `step * gradients` to `x` in place.

    Args:
        x: Image array to optimise; it is updated in place.
        iterations: Maximum number of ascent steps.
        step: Multiplier applied to the gradients at each update.
        max_loss: Optional threshold; the loop stops (before printing or
            updating) as soon as the evaluated loss exceeds it.

    Returns:
        The updated array `x`.
    """
    for step_index in range(iterations):
        current_loss, current_grads = eval_loss_and_grads(x)
        loss_exceeded = max_loss is not None and current_loss > max_loss
        if loss_exceeded:
            break
        print('...Loss value at', step_index, ':', current_loss)
        x += step * current_grads
    return x

In [33]:
import scipy
import numpy as np
from keras.preprocessing import image

def resize_img(img, size):
    """Resize a 4-D image array along axes 1 and 2 using linear interpolation.

    Args:
        img: Array-like with four axes; axes 0 and 3 keep their length.
        size: Pair `(size[0], size[1])` giving the target lengths of axes 1
            and 2 respectively.

    Returns:
        A new array produced by `scipy.ndimage.zoom` with `order=1`; the
        input is not modified.
    """
    # Import the submodule explicitly: a bare `import scipy` does not
    # guarantee that `scipy.ndimage` is loaded and reachable as an attribute.
    from scipy import ndimage

    # zoom() allocates its own output, so no defensive copy is needed.
    img = np.asarray(img)
    factors = (1,
               float(size[0]) / img.shape[1],
               float(size[1]) / img.shape[2],
               1)
    return ndimage.zoom(img, factors, order=1)

def deprocess_image(x):
    """Convert a single-image tensor into a displayable uint8 image array.

    The batch axis is dropped by reshaping (so `x` must hold exactly one
    3-channel image), values are mapped with `(x / 2 + 0.5) * 255`, clipped
    to [0, 255] and cast to uint8.

    Args:
        x: 4-D numpy array, laid out according to `K.image_data_format()`.

    Returns:
        A new uint8 array of shape (height, width, 3). The input array is
        left unmodified.
    """
    if K.image_data_format() == 'channels_first':
        x = x.reshape((3, x.shape[2], x.shape[3]))
        x = x.transpose((1, 2, 0))
    else:
        x = x.reshape((x.shape[1], x.shape[2], 3))
    # Out-of-place arithmetic: reshape() can return a view, so the previous
    # in-place `/=`, `+=`, `*=` wrote through to the caller's array (and
    # raised on integer input). Operation order is kept identical.
    x = (x / 2. + 0.5) * 255
    return np.clip(x, 0, 255).astype('uint8')

def save_img(img, fname):
    """Deprocess the image tensor `img` and write it to the file `fname`.

    Args:
        img: Image tensor accepted by `deprocess_image`; a copy is passed on,
            so the caller's array is not touched.
        fname: Destination file path.
    """
    pil_img = deprocess_image(np.copy(img))
    # `scipy.misc.imsave` is deprecated since SciPy 1.0 and removed in 1.2, so
    # save through the Keras image utilities that are already imported.
    # - data_format='channels_last': deprocess_image always returns (H, W, 3).
    # - scale=False: the array is already uint8 in [0, 255]; do not re-stretch it.
    image.array_to_img(pil_img, data_format='channels_last', scale=False).save(fname)

def preprocess_image(img_path):
    """Load an image file and convert it into a tensor Inception V3 can process.

    The image is opened, converted to an array, given a leading batch axis,
    and passed through `inception_v3.preprocess_input`.

    Args:
        img_path: Path of the image file to load.

    Returns:
        The preprocessed array with a leading batch axis of length 1.
    """
    pixels = image.img_to_array(image.load_img(img_path))
    batch = np.expand_dims(pixels, axis=0)
    return inception_v3.preprocess_input(batch)

In [34]:
step = 0.02   # Gradient-ascent step size.
num_octave = 3  # Number of scales at which gradient ascent is run.
octave_scale = 1.4  # Size ratio between two successive scales.
iterations = 30  # Number of ascent steps per scale.

max_loss = 10.  # Ascent is interrupted once the loss exceeds this value, to avoid artifacts.

base_image_path = 'creative_commons_elephant.jpg'  # Path of the base image.

img = preprocess_image(base_image_path)  # Load the base image into a numpy array.

original_shape = img.shape[1:3]     # Build the list of shape tuples defining the scales at which gradient ascent runs.
successive_shapes = [original_shape]
for i in range(1, num_octave):
    # Each further scale divides both dimensions by octave_scale ** i (truncated to int).
    shape = tuple([int(dim / (octave_scale ** i)) for dim in original_shape])
    print('shape: ', shape)
    successive_shapes.append(shape)

successive_shapes = successive_shapes[::-1]  # Reverse the list so the shapes are in increasing order.

original_img = np.copy(img)
shrunk_original_img = resize_img(img, successive_shapes[0])  # Resize the image array down to the smallest scale.

# Process the scales from smallest to largest; `img` carries the dream image
# from one scale to the next.
for shape in successive_shapes:
    print('Processing image shape', shape)
    img = resize_img(img, shape)   # Scale the dream image up to the current shape.
    img = gradient_ascent(img,     # Run gradient ascent, altering the dream image.
                          iterations=iterations,
                          step=step,
                          max_loss=max_loss)
    upscaled_shrunk_original_img = resize_img(shrunk_original_img, shape) # Upscale the smaller version of the original image; it will be pixelated.
    same_size_original = resize_img(original_img, shape)  # Compute the high-quality version of the original image at this size.
    lost_detail = same_size_original - upscaled_shrunk_original_img  # The difference between the two is the detail lost when scaling up.
    
    img += lost_detail  # Re-inject the lost detail into the dream image.
    shrunk_original_img = resize_img(original_img, shape)  # Reference for the next scale's lost-detail computation.
    # Uncomment to also save the intermediate result of every scale:
    #save_img(img, fname='dream_at_scale_' + str(shape) + '.png')

# Write the result of the largest scale to disk.
save_img(img, fname='final_dream.png')

shape:  (250, 375)
shape:  (179, 267)
Processing image shape (179, 267)
...Loss value at 0 : 1.1681775
...Loss value at 1 : 1.4419689
...Loss value at 2 : 2.0733752
...Loss value at 3 : 2.6974218
...Loss value at 4 : 3.396371
...Loss value at 5 : 4.09803
...Loss value at 6 : 4.7792854
...Loss value at 7 : 5.387398
...Loss value at 8 : 5.9562354
...Loss value at 9 : 6.623434
...Loss value at 10 : 7.327145
...Loss value at 11 : 7.907139
...Loss value at 12 : 8.590636
...Loss value at 13 : 9.485498
Processing image shape (250, 375)
...Loss value at 0 : 2.6431794
...Loss value at 1 : 3.7386477
...Loss value at 2 : 3.990149
...Loss value at 3 : 5.176982
...Loss value at 4 : 5.7929497
...Loss value at 5 : 5.6096888
...Loss value at 6 : 6.839927
...Loss value at 7 : 7.2192755
...Loss value at 8 : 7.9933596
...Loss value at 9 : 8.696547
...Loss value at 10 : 9.934326
...Loss value at 11 : 9.352362
Processing image shape (351, 525)
...Loss value at 0 : 2.8533874
...Loss value at 1 : 3.989983
..

`imsave` is deprecated in SciPy 1.0.0, and will be removed in 1.2.0.
Use ``imageio.imwrite`` instead.


In [35]:
# Show the list of scales after reversal (smallest shape first).
successive_shapes

[(179, 267), (250, 375), (351, 525)]

In [38]:
# Re-derive the downscaled shapes on their own to check the octave arithmetic.
# NOTE(review): this rebinds `temp`, which an earlier cell used for a random test array.
#octave_scale = 1.4
for i in range(1, num_octave):
    temp = tuple([int(dim / (octave_scale ** i)) for dim in original_shape])
    print(temp)

(250, 375)
(179, 267)
