In [1]:
import pandas as pd 
import numpy as np

from time import sleep
from tqdm import tqdm

from keras.callbacks import EarlyStopping
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.datasets import mnist

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

from keras.applications.vgg16 import preprocess_input
from keras.applications.vgg16 import VGG16

import matplotlib.pyplot as plt
%matplotlib inline

In [2]:
def add_padding(dataset=None, pad_width = 0, constant_values=0) -> []:
    padded_dataset = []
    
    for i in dataset:
        padded = np.pad(i, pad_width=pad_width, mode='constant', constant_values=constant_values)
        padded_dataset.append(padded[:, :, np.newaxis])
    
    return padded_dataset

def extract_features(dataset):
    features = []

    for x in tqdm(dataset):
        p = np.repeat(x, 3, axis=-1)
        p = preprocess_input(p)
        predict = np.expand_dims(p, axis=0)
        predict = model.predict(predict)
        features.append(predict[0][0][0])
    
    return features
    
def write_matrix_to_file(matrix=None, file_name="random.txt"):
    with open(file_name, 'wb') as f:
        for line in matrix:
            np.savetxt(f, line, delimiter=' ')

In [3]:
(x_train, y_train), (x_test, y_test) = mnist.load_data()

new_x_train = add_padding(x_train, pad_width=2, constant_values=0)
new_x_test = add_padding(x_test, pad_width=2, constant_values=0)

In [4]:
model = VGG16(include_top=False, weights='imagenet', input_shape=(32, 32, 3))

In [5]:
model.summary()

Model: "vgg16"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         [(None, 32, 32, 3)]       0         
_________________________________________________________________
block1_conv1 (Conv2D)        (None, 32, 32, 64)        1792      
_________________________________________________________________
block1_conv2 (Conv2D)        (None, 32, 32, 64)        36928     
_________________________________________________________________
block1_pool (MaxPooling2D)   (None, 16, 16, 64)        0         
_________________________________________________________________
block2_conv1 (Conv2D)        (None, 16, 16, 128)       73856     
_________________________________________________________________
block2_conv2 (Conv2D)        (None, 16, 16, 128)       147584    
_________________________________________________________________
block2_pool (MaxPooling2D)   (None, 8, 8, 128)         0     

In [5]:
train_features = extract_features(new_x_train)

100%|██████████| 60000/60000 [29:52<00:00, 33.47it/s]


In [6]:
test_features = extract_features(new_x_test)

100%|██████████| 10000/10000 [05:04<00:00, 32.87it/s]


In [7]:
train_features = np.matrix(train_features)
write_matrix_to_file(train_features, file_name="vgg16_train_features.out")

In [8]:
test_features = np.matrix(test_features)
write_matrix_to_file(test_features, file_name="vgg16_test_features.out")