prepare_model_coco.py

#import
import pdb
from sys import stdout
import scipy
import  cPickle as pickle
import numpy as np
import matplotlib.pyplot as plt
#matplotlib inline
import sys
#sys.path.insert(0, caffe_root + 'python')
import caffe
plt.rcParams['figure.figsize'] = (10, 10)
plt.rcParams['image.interpolation'] = 'nearest'
plt.rcParams['image.cmap'] = 'gray'
import os
import pandas as pd
import nltk

#Setup
print 'Start Setup'
#originalImagesPath = 'data/coco/originalImages'
trainImagesPath = '/tmp3/alvin/dataset/MSCOCO2014/train2014_224/'
valImagesPath = '/tmp3/alvin/dataset/MSCOCO2014/val2014_224/'
vgg_ilsvrc_19_layoutFileName = '/tmp3/alvin/VGG_ILSVRC_19_layers_deploy.prototxt'
vgg_ilsvrc_19_modelFileName = '/tmp3/alvin/VGG_ILSVRC_19_layers.caffemodel'
dataPath = '/tmp3/alvin/arctic_data/coco/'
annotation_path = '/tmp3/alvin/dataset/MSCOCO2014/captions_train2014.json'
#splitFileName = dataPath + 'dataset_coco.json'
experimentPrefix = '.exp1'
print 'End Setup'

#Setup caffe
print 'Start Setup caffe'
caffe.set_device(1)
caffe.set_mode_gpu()
net = caffe.Net(vgg_ilsvrc_19_layoutFileName,vgg_ilsvrc_19_modelFileName,caffe.TEST)
# input preprocessing: 'data' is the name of the input blob == net.inputs[0]
transformer = caffe.io.Transformer({'data': net.blobs['data'].data.shape})
transformer.set_transpose('data', (2,0,1))
transformer.set_mean('data', np.load('/tmp3/alvin/ilsvrc_2012_mean.npy').mean(1).mean(1)) # mean pixel
transformer.set_raw_scale('data', 255)  # the reference model operates on images in [0,255] range instead of [0,1]
transformer.set_channel_swap('data', (2,1,0))  # the reference model has channels in BGR order instead of RGB
print 'End Setup caffe'

#filelist:
#./splits/coco_val.txt
#./splits/coco_test.txt
#./splits/coco_train.txt

# set net to batch size of 50
# net.blobs['data'].reshape(10,3,224,224)
print 'Start middle'
files = [ 'val','test','train']
for fname in files:
    print fname 
    f = open('./splits/coco_'+fname+'.txt')
    counter = 0
    imageList = [i for i in f]
    numImage = len(imageList)
    #pdb.set_trace()
    result = np.empty((numImage, 100352))

    for i in range(numImage):
        fn = imageList[i].rstrip()
        if fname=='train':
            net.blobs['data'].data[...] = transformer.preprocess('data', caffe.io.load_image(trainImagesPath+fn))
        else:
            net.blobs['data'].data[...] = transformer.preprocess('data', caffe.io.load_image(valImagesPath+fn))
        out = net.forward()
        feat = net.blobs['conv5_4'].data[0]
        reshapeFeat = np.swapaxes(feat,0,2)
        reshapeFeat2 = np.reshape(reshapeFeat,(1,-1))
        counter += 1
        stdout.write("\r%d" % counter)
        stdout.flush()
        result[i,:] = reshapeFeat2
    print result.shape

    resultSave = scipy.sparse.csr_matrix(result)
    resultSave32 = resultSave.astype('float32')
    if fname == 'train':
        np.savez(dataPath + 'coco_feature.' + fname + experimentPrefix, data=resultSave32.data, indices=resultSave32.indices, indptr=resultSave32.indptr, shape=resultSave.shape)
    else:
        fileName = open(dataPath + 'coco_feature.' + fname + experimentPrefix + '.pkl','wb') 
        pickle.dump(resultSave32, fileName, -1) 
        fileName.close()

print 'End middle'


print 'Start end'
#np.savez(dataPath + 'coco_feature.' + fname + experimentPrefix, data=resultSave32.data, indices=resultSave32.indices, indptr=resultSave32.indptr, shape=resultSave.shape)

def save_sparse_csr(filename,array):
    np.savez(filename,data = array.data ,indices=array.indices, indptr =array.indptr, shape=array.shape)

def load_sparse_csr(filename):
    loader = np.load(filename)
    return csr_matrix((loader['data'], loader['indices'], loader['indptr']), shape = loader['shape'])

capDict = pickle.load(open('capdict.pkl','rb'))

files = ['test', 'val']
for name in files:
    counter = 0
    with open(dataPath + 'coco_feature.' + name + experimentPrefix + '.pkl','rb') as fp:
        feat = pickle.load(fp)
    filenames = open('./splits/coco_'+name+'.txt')
    cap = []
    for imageFile in filenames:
        imageFile = imageFile.rstrip()
        for sen in capDict[imageFile]:
            cap.append([sen.rstrip(), counter])
        counter += 1
    saveFile = open(dataPath + 'coco_align.' + name + experimentPrefix + '.pkl', 'wb') 
    pickle.dump(cap, saveFile, protocol=pickle.HIGHEST_PROTOCOL) 
    pickle.dump(feat, saveFile, protocol=pickle.HIGHEST_PROTOCOL)
    saveFile.close()
    filenames.close()

files = ['train']
for name in files:
    counter = 0
    filenames = open('./splits/coco_'+name+'.txt')
    cap = []
    for imageFile in filenames:
        imageFile = imageFile.rstrip()
        for sen in capDict[imageFile]:
            cap.append([sen.rstrip(), counter])
        counter += 1
    saveFile = open(dataPath + 'coco_align.' + name + experimentPrefix + '.pkl', 'wb') 
    pickle.dump(cap, saveFile, protocol=pickle.HIGHEST_PROTOCOL) 
    saveFile.close()
    filenames.close()

#print wordsDict['Two']
#print resultSave32

print 'Start end'