In [1]:
# !pip install tensorflow
# !pip install keras
import numpy as np
from keras import layers
from keras.layers import Input, Add, Dense, Activation, ZeroPadding2D, BatchNormalization, Dropout, concatenate, Flatten, UpSampling2D,Conv2D, AveragePooling2D, MaxPooling2D, GlobalMaxPooling2D
from keras.models import Model, load_model
from keras.preprocessing import image
from keras.utils import layer_utils
from keras.utils.data_utils import get_file
from keras.applications.imagenet_utils import preprocess_input
from IPython.display import SVG
from keras.utils.vis_utils import model_to_dot
from keras.initializers import glorot_uniform
import scipy.misc
import matplotlib.pyplot as plt
from matplotlib.pyplot import imshow
import copy, pickle
from tensorflow.keras.optimizers import Adam
%matplotlib inline

import keras.backend as K
# Tensors in this notebook are laid out as (batch, height, width, channels).
K.set_image_data_format('channels_last')
# NOTE: the former `K.set_learning_phase(1)` call was removed on purpose.
# It is deprecated, and pinning the global learning phase to "training" keeps
# Dropout active and makes BatchNormalization use batch statistics wherever
# Keras is not given an explicit `training` flag, which would distort
# model.evaluate / model.predict results. fit/evaluate/predict select the
# correct phase on their own.




In [2]:
# Names of the 12 input channels, in the order used to index the last axis of X.
INPUT_FEATURES = ['elevation', 'th', 'vs',  'tmmn', 'tmmx', 'sph', 
                  'pr', 'pdsi', 'NDVI', 'population', 'erc', 'PrevFireMask']

# Features to feed the model. All channels are used; to experiment with a
# subset, replace the right-hand side with a list of names, e.g.
# ['PrevFireMask', 'NDVI', 'elevation', 'tmmx', 'tmmn'].
# (The previous version assigned that subset and then immediately overwrote
# it, so the subset never took effect.)
which_features = INPUT_FEATURES.copy()

# Channel indices of the selected features within INPUT_FEATURES.
which_idx = [INPUT_FEATURES.index(f) for f in which_features]
which_idx


[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11]

In [3]:
# Training split.
X_train, Y_train = np.load('X_train_final.npy'), np.load('Y_train_final.npy')

# NOTE: despite the variable names, X_test / Y_test hold the *validation*
# files (X_val.npy / Y_val.npy).
X_test, Y_test = np.load('X_val.npy'), np.load('Y_val.npy')

# The held-out test files are kept under the *_test_metrics names.
X_test_metrics, Y_test_metrics = np.load('X_test.npy'), np.load('Y_test.npy')




In [4]:
# X_train = X_train[:,:,:,which_idx]

In [5]:
# Inspect the training inputs' shape; it is unpacked into (m, n_h, n_w, n_c) below.
X_train.shape

(10836, 32, 32, 12)

In [6]:
# Inspect the training labels' shape (one mask per sample, no channel axis).
Y_train.shape

(10836, 32, 32)

In [7]:
# Sample count and per-sample dimensions; n_h, n_w and n_c define the model's
# Input shape in model_arch.
m, n_h, n_w, n_c = X_train.shape
(m, n_h, n_w, n_c)



(10836, 32, 32, 12)

In [8]:

# X_test = X_test[:,:,:,which_idx]


In [9]:
# Shape of the validation inputs (X_test is loaded from X_val.npy).
X_test.shape



(1404, 32, 32, 12)

In [10]:
# Shape of the held-out test inputs (X_test_metrics is loaded from X_test.npy).
X_test_metrics.shape

(1362, 32, 32, 12)

In [11]:
# Map the -1 label value to 0 so every target is a valid binary label for
# binary_crossentropy. (-1 is presumably an "unlabeled" marker -- confirm
# against the dataset description.)
# The held-out test labels are remapped as well: model_arch evaluates on
# Y_test_metrics, and leaving -1 there would make its loss and Dice score
# inconsistent with the train/validation handling. The call is a no-op if that
# array contains no -1.
Y_train = np.where(Y_train == -1, 0, Y_train)
Y_test = np.where(Y_test == -1, 0, Y_test)
Y_test_metrics = np.where(Y_test_metrics == -1, 0, Y_test_metrics)

In [17]:
def dice_coef(y_true, y_pred, smooth=1):
    """Smoothed Dice coefficient computed over all elements of the batch.

    Both tensors are flattened, so the score is a single scalar:
        (2 * sum(y_true * y_pred) + smooth) / (sum(y_true) + sum(y_pred) + smooth)

    Args:
        y_true: ground-truth tensor.
        y_pred: prediction tensor with the same number of elements as y_true.
        smooth: constant added to numerator and denominator; keeps the ratio
            defined when both tensors sum to zero.

    Returns:
        Scalar backend tensor holding the Dice coefficient.
    """
    truth = K.flatten(y_true)
    pred = K.flatten(y_pred)
    overlap = K.sum(truth * pred)
    numerator = 2. * overlap + smooth
    denominator = K.sum(truth) + K.sum(pred) + smooth
    return numerator / denominator

In [13]:
# Notebook-level default hyperparameters. The sweep cells further down rebind
# learning_rate / dropout_rate / batch_size as loop variables and pass
# epochs=32 to model_arch explicitly.
epochs, batch_size = 64, 64
learning_rate = 0.001
dropout_rate = 0.1

In [27]:
def _conv_block(x, filters, dropout_rate):
    """Apply Conv(3x3, ReLU) -> Dropout -> Conv(3x3) -> BatchNorm -> ReLU to `x`."""
    x = Conv2D(filters, (3,3), padding='same', activation='relu', kernel_initializer='he_normal')(x)
    x = Dropout(dropout_rate)(x)
    # No activation on the second conv: ReLU is applied once, after BatchNorm.
    x = Conv2D(filters, (3,3), padding='same', kernel_initializer='he_normal')(x)
    x = BatchNormalization(axis=3)(x)
    return Activation('relu')(x)


def model_arch(learning_rate, dropout_rate, batch_size, epochs = 32):
    """Build, train and evaluate a U-Net-style encoder/decoder network.

    The encoder has three conv stages (16, 32, 64 filters), each followed by
    2x2 max pooling, then a 128-filter bottleneck. The decoder mirrors it with
    2x upsampling and skip connections (concatenation with the matching
    encoder stage). A 1x1 sigmoid convolution produces one output channel.

    Every stage now uses the same layout (see _conv_block). The first encoder
    stage previously also applied ReLU on its second convolution, before
    BatchNorm, unlike all other stages; that inconsistency was removed.

    Relies on notebook-level globals: n_h, n_w, n_c (input shape), X_train /
    Y_train (training data), X_test / Y_test and X_test_metrics /
    Y_test_metrics (evaluation data).

    Args:
        learning_rate: initial Adam learning rate.
        dropout_rate: dropout rate used inside every conv stage.
        batch_size: mini-batch size passed to model.fit.
        epochs: number of training epochs (also used to derive the decay).

    Returns:
        Tuple (history, loss, dice_coef2, loss_test, dice_coef2_test):
        the Keras History from fit, the loss and Dice metric on
        (X_test, Y_test), then the loss and Dice metric on
        (X_test_metrics, Y_test_metrics).
    """
    X = Input((n_h, n_w, n_c))

    # Contraction path
    c1 = _conv_block(X, 16, dropout_rate)
    p1 = MaxPooling2D((2,2))(c1)

    c2 = _conv_block(p1, 32, dropout_rate)
    p2 = MaxPooling2D((2,2))(c2)

    c3 = _conv_block(p2, 64, dropout_rate)
    p3 = MaxPooling2D((2,2))(c3)

    # Bottleneck
    c4 = _conv_block(p3, 128, dropout_rate)

    # Expansion path: upsample, concatenate the matching encoder stage, convolve
    u5 = concatenate([UpSampling2D(size = (2,2))(c4), c3])
    c5 = _conv_block(u5, 64, dropout_rate)

    u6 = concatenate([UpSampling2D(size = (2,2))(c5), c2])
    c6 = _conv_block(u6, 32, dropout_rate)

    u7 = concatenate([UpSampling2D(size = (2,2))(c6), c1])
    c7 = _conv_block(u7, 16, dropout_rate)

    outputs = Conv2D(1, (1,1), activation = 'sigmoid')(c7)

    model = Model(inputs = X, outputs = outputs)

    # NOTE(review): `decay` is derived per epoch here, but the legacy Keras
    # optimizers appear to apply it per update step -- confirm this is the
    # intended schedule. Newer Keras releases no longer accept `decay`.
    decay_rate = learning_rate/epochs
    opt = Adam(learning_rate=learning_rate, beta_1=0.9, beta_2=0.999, epsilon=1e-8, decay=decay_rate, amsgrad=False)

    model.compile(optimizer=opt, loss='binary_crossentropy', metrics=[dice_coef])

    history = model.fit(X_train, Y_train, epochs = epochs, batch_size = batch_size)

    # Metrics on the validation arrays, then on the held-out test arrays.
    loss, dice_coef2 = model.evaluate(X_test, Y_test)
    loss_test, dice_coef2_test = model.evaluate(X_test_metrics, Y_test_metrics)

    return history, loss, dice_coef2, loss_test, dice_coef2_test



In [28]:
# Accumulates one entry per hyperparameter configuration, keyed by a string
# describing the configuration (filled in by the sweep cells below).
results = dict()



In [None]:

# Learning-rate sweep (dropout and batch size held fixed).
# Changes from the previous version:
#   * the held-out test metrics returned by model_arch are now stored too
#     (they were computed and then dropped);
#   * the unused enumerate() indices are gone;
#   * the trailing `del` is gone: `results` keeps references to the same
#     objects, so it freed nothing, and it removed the `history` name that the
#     plotting cell further down reads.
for learning_rate in [0.001, 0.01, 0.05]:
    for dropout_rate in [0.1]:
        for batch_size in [32]:
            history, loss, dice_coef2, loss_test, dice_coef2_test = model_arch(
                learning_rate, dropout_rate, batch_size, epochs = 32)
            run_key = 'learning_{}_dropout_{}_batch_size_{}'.format(
                learning_rate, dropout_rate, batch_size)
            results[run_key] = {
                'history': history,
                'loss': loss,
                'dice_coef': dice_coef2,
                'loss_test': loss_test,
                'dice_coef_test': dice_coef2_test,
            }

    

Epoch 1/32
Epoch 2/32
Epoch 3/32
Epoch 4/32
Epoch 5/32
Epoch 6/32
Epoch 7/32
Epoch 8/32
Epoch 9/32
Epoch 10/32
Epoch 11/32
Epoch 12/32
Epoch 13/32
Epoch 14/32
Epoch 15/32
Epoch 16/32
Epoch 17/32
Epoch 18/32
Epoch 19/32
Epoch 20/32
Epoch 21/32
Epoch 22/32
Epoch 23/32
Epoch 24/32
Epoch 25/32
Epoch 26/32
Epoch 27/32
Epoch 28/32
Epoch 29/32
Epoch 30/32
Epoch 31/32
Epoch 32/32
Epoch 1/32
Epoch 2/32
Epoch 3/32

In [None]:

# Batch-size sweep (learning rate and dropout held fixed).
# Fix: model_arch returns five values (history, validation loss/Dice, test
# loss/Dice); unpacking only three raised
# "ValueError: too many values to unpack". The test metrics are stored too.
# Note: batch_size=32 repeats a configuration already trained by the
# learning-rate sweep and overwrites that entry in `results`.
for learning_rate in [0.001]:
    for dropout_rate in [0.1]:
        for batch_size in [16, 32, 64]:
            history, loss, dice_coef2, loss_test, dice_coef2_test = model_arch(
                learning_rate, dropout_rate, batch_size, epochs = 32)
            run_key = 'learning_{}_dropout_{}_batch_size_{}'.format(
                learning_rate, dropout_rate, batch_size)
            results[run_key] = {
                'history': history,
                'loss': loss,
                'dice_coef': dice_coef2,
                'loss_test': loss_test,
                'dice_coef_test': dice_coef2_test,
            }

    

In [None]:

# Dropout sweep (learning rate and batch size held fixed).
# Fix: model_arch returns five values (history, validation loss/Dice, test
# loss/Dice); unpacking only three raised
# "ValueError: too many values to unpack". The test metrics are stored too.
# Note: dropout_rate=0.1 repeats the batch_size=64 configuration of the
# batch-size sweep and overwrites that entry in `results`.
for learning_rate in [0.001]:
    for dropout_rate in [0.05, 0.1, 0.2]:
        for batch_size in [64]:
            history, loss, dice_coef2, loss_test, dice_coef2_test = model_arch(
                learning_rate, dropout_rate, batch_size, epochs = 32)
            run_key = 'learning_{}_dropout_{}_batch_size_{}'.format(
                learning_rate, dropout_rate, batch_size)
            results[run_key] = {
                'history': history,
                'loss': loss,
                'dice_coef': dice_coef2,
                'loss_test': loss_test,
                'dice_coef_test': dice_coef2_test,
            }

    

In [None]:
# Persist the sweep results. The context manager guarantees the file is
# flushed and closed even if pickling raises.
# NOTE(review): each entry stores a Keras History object, which keeps a
# reference to its model; if pickling fails or the file is very large, store
# `history.history` (a plain dict of metric lists) instead.
with open('results_alpha.pkl', 'wb') as results_file:
    pickle.dump(results, results_file)



In [None]:
# Training curves for one stored run.
# The run is looked up in `results` instead of relying on a leftover `history`
# variable (the sweep cells delete it, which made this cell raise NameError).
# The figure title is built from the run actually plotted; the old hard-coded
# title (Epochs = 64) matched none of the configured runs.
plot_learning_rate, plot_dropout_rate, plot_batch_size = 0.01, 0.1, 32
run_key = 'learning_{}_dropout_{}_batch_size_{}'.format(
    plot_learning_rate, plot_dropout_rate, plot_batch_size)
history = results[run_key]['history']
n_epochs = len(history.history['loss'])

print(history.history.keys())
plt.figure(figsize=(12,6))
plt.subplot(121)
plt.plot(history.history['loss'])
plt.xlabel('Epoch')
plt.ylabel('Binary Crossentropy Loss')
plt.title('Loss')
plt.subplot(122)
plt.plot(history.history['dice_coef'])
plt.xlabel('Epoch')
plt.ylabel('Dice Coefficient')
plt.title('Dice Coefficient')
plt.suptitle('Epochs = {}, Learning Rate = {}, Dropout = {}, Batch Size = {}, Adam Optimizer'.format(
    n_epochs, plot_learning_rate, plot_dropout_rate, plot_batch_size));


In [None]:
# `model` only exists as a local inside model_arch, so it was undefined here.
# Recover the trained network from the most recently stored History callback
# (Keras callbacks expose the model they were attached to as `.model`).
model = results[list(results)[-1]]['history'].model

# Predict a single validation sample; expand_dims adds the batch axis.
x = X_test[1122,:,:,:]
x = np.expand_dims(x, axis=0)
y = model.predict(x)
# Binarise the sigmoid output at a 0.3 threshold.
y = np.where(y>0.3, 1, 0)

In [None]:
def plot_examples(i, model=None, threshold=0.5):
    """Plot previous fire mask, true mask and predicted mask for sample `i`.

    Reads the notebook-level arrays X_test / Y_test.

    Args:
        i: index of the sample within X_test / Y_test.
        model: trained Keras model used for the prediction. When omitted, the
            notebook-level `model` is used if defined; otherwise the model
            attached to the most recently stored History in `results`.
        threshold: cut-off applied to the sigmoid output to get a binary mask.

    Raises:
        RuntimeError: if no model is passed and none can be found.
    """
    if model is None:
        # Previous behaviour: use the global `model`, if one exists.
        model = globals().get('model')
    if model is None:
        if not results:
            raise RuntimeError('plot_examples: no trained model available; '
                               'pass model=... or run a training cell first')
        model = results[list(results)[-1]]['history'].model

    # Assumes the channel order of X follows INPUT_FEATURES (index 11).
    prev_fire_channel = INPUT_FEATURES.index('PrevFireMask')

    x = np.expand_dims(X_test[i,:,:,:], axis=0)  # add the batch axis
    y = model.predict(x)
    y = np.where(y>threshold, 1, 0)

    plt.figure(figsize = (20,6))
    plt.subplot(131)
    plt.imshow(X_test[i,:,:,prev_fire_channel])
    plt.title('Previous fire mask')
    plt.colorbar()
    plt.subplot(132)
    plt.imshow(Y_test[i,:,:])
    plt.title('True fire mask')
    plt.colorbar()
    plt.subplot(133)
    plt.imshow(y[0,:,:,0])
    plt.title('Predicted fire mask')
    plt.colorbar()
    plt.clim(0, 1)

In [None]:
# Visualise sample 399 of the validation arrays (X_test / Y_test).
plot_examples(399)

In [None]:
# Mark positions whose label is -1 (value -1) versus everything else (value 0).
# The result goes into its own variable: assigning it back to Y_train replaced
# the training labels, and since the -1 values were already mapped to 0 in an
# earlier cell, it left Y_train as all zeros.
unlabeled_mask = np.where(Y_train==-1, -1, 0)

In [None]:
# Index arrays of every position in Y_train whose label equals -1
# (empty arrays mean no such label remains).
np.where(Y_train==-1)