In [1]:
%load_ext autoreload
%autoreload 2
import numpy as np
import tensorflow as tf
from features.settings import Baseline_Settings, Pair_Hinge_Settings, Pair_Log_Settings, Triplet_Hinge_Settings, Triplet_Log_Settings
from features.models import ConvModelSmall, ConvModelMedium, ConvModelLarge
from features.models import GCNNModelSmall, GCNNModelMedium, GCNNModelLarge
from classes.models import LinearClassifier
from datasets import load_mnist_datasets, load_cifar10
from sklearn.svm import LinearSVC
import time

  return f(*args, **kwds)
  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [2]:
# Load CIFAR-10 with augmentation switched on. This is slow (about 100 s in the
# recorded run). Judging by the names and by how test_model unpacks them, the
# call yields the dataset splits plus plain / pair / triplet sampler triples
# -- TODO confirm against datasets.load_cifar10.
(
    data,
    samplers,
    pair_samplers,
    triplet_samplers,
) = load_cifar10(augment=True)

CIFAR-10 loaded in 101 seconds


In [3]:
def test_model(feature_model, settings, data, num_features, num_classes, feature_samplers, classification_samplers,
               f_num_steps, f_lr, f_keep_prob, f_reg, c_num_steps, c_lr, c_reg):
    
    tf.reset_default_graph()
    
    f_train, f_valid, f_test = feature_samplers
    c_train, c_valid, c_test = classification_samplers
    (x_train, y_train), (x_valid, y_valid), (x_test, y_test) = data
    _, H, W, C = x_train.shape
    
    x = tf.placeholder(tf.float32, shape=[None, H, W, C])
    y = tf.placeholder(tf.int64, shape=[None])    
    dropout = tf.placeholder(tf.float32)
    training = tf.placeholder(tf.bool)
    f_model = feature_model(x=x, y=y, settings=settings, num_chan=C, num_features=num_features, 
              lr=f_lr, reg=f_reg, dropout=dropout, training=training)
    
    features = tf.placeholder(tf.float32, shape=[None, num_features])
    c_model = LinearClassifier(x=features, y=y, num_features=num_features, num_classes=num_features, 
                               lr=c_lr, reg=c_reg)
    
    with tf.Session() as sess:
        sess.run(tf.global_variables_initializer())
        
        print("begin training features // num_features: %g, lr: %g, reg: %g, dropout: %g" %(num_features, f_lr, f_reg, f_keep_prob))
        train_time = time.time()
        for step in range(f_num_steps):        
            x_, y_ = f_train.sample(700)
            sess.run(f_model.optimize, feed_dict={x:x_, y:y_, dropout:f_keep_prob, training:True})     
            if step % 1000 == 0:
                train_loss, train_acc = sess.run([f_model.loss, f_model.acc], 
                                                 feed_dict={x:x_, y:y_, dropout:1.0, training:False})
                print("\tstep %d: train loss %g, train error %g"%(step, train_loss, 1 - train_acc))  
        train_time = time.time() - train_time
        print("end training features // time elapsed: %.4f s"%(train_time))
        
        eval_test_time = time.time()
        x_, y_ = f_valid.sample(1000)
        test_error = 1 - sess.run(f_model.acc, feed_dict={x:x_, y:y_, dropout:1.0, training:False})
        eval_test_time = time.time() - eval_test_time
        print("validation set error: %.4f // time elapsed: %.4f s"%(test_error, eval_test_time))
        
        eval_test_time = time.time()
        x_, y_ = f_test.sample(1000)
        test_error = 1 - sess.run(f_model.acc, feed_dict={x:x_, y:y_, dropout:1.0, training:False})
        eval_test_time = time.time() - eval_test_time
        print("test set error: %.4f // time elapsed: %.4f s"%(test_error, eval_test_time))
        
        print("begin training classifier")
        train_time = time.time()
        for step in range(c_num_steps):        
            x_, y_ = c_train.sample(700)
            features_ = sess.run(f_model.features, feed_dict={x:x_, dropout:1.0, training:False})
            sess.run(c_model.optimize, feed_dict={features:features_, y:y_, x:x_, dropout:1.0, training:False})
            if step % 1000 == 0:
                train_loss, train_acc = sess.run([c_model.loss, c_model.acc], feed_dict={features:features_, y:y_})
                print("\tstep %d: train loss %g, train error %g"%(step, train_loss, 1 - train_acc))  
        train_time = time.time() - train_time
        print("end training classifier // time elapsed: %.4f s"%(train_time))
        
        eval_test_time = time.time()
        features_ = sess.run(f_model.features, feed_dict={x:x_valid, dropout:1.0, training:False})
        test_error = 1 - sess.run(c_model.acc, feed_dict={features:features_, y:y_valid})
        eval_test_time = time.time() - eval_test_time
        print("validation set error: %.4f // time elapsed: %.4f s"%(test_error, eval_test_time))
        
        eval_test_time = time.time()
        features_ = sess.run(f_model.features, feed_dict={x:x_test, dropout:1.0, training:False})
        test_error = 1 - sess.run(c_model.acc, feed_dict={features:features_, y:y_test})
        eval_test_time = time.time() - eval_test_time
        print("test set error: %.4f // time elapsed: %.4f s"%(test_error, eval_test_time))

In [4]:
# Baseline experiment: GCNNModelSmall with Baseline_Settings. The same plain
# samplers drive both the feature-network stage and the classifier stage.
test_model(
    feature_model=GCNNModelSmall,
    settings=Baseline_Settings,
    num_features=10,
    num_classes=10,
    data=data,
    feature_samplers=samplers,
    classification_samplers=samplers,
    # feature-network stage
    f_num_steps=50000,
    f_lr=0.01,
    f_keep_prob=0.6,
    f_reg=0.001,
    # linear-classifier stage
    c_num_steps=30000,
    c_lr=0.005,
    c_reg=0.01,
)

begin training features // num_features: 10, lr: 0.01, reg: 0.001, dropout: 0.6
	step 0: train loss 2.86984, train error 0.89
	step 1000: train loss 2.16015, train error 0.598571
	step 2000: train loss 1.94927, train error 0.571429
	step 3000: train loss 1.86522, train error 0.528571
	step 4000: train loss 1.55336, train error 0.42
	step 5000: train loss 1.62448, train error 0.465714
	step 6000: train loss 1.5064, train error 0.414286
	step 7000: train loss 1.41088, train error 0.374286
	step 8000: train loss 1.40901, train error 0.384286
	step 9000: train loss 1.3384, train error 0.362857
	step 10000: train loss 1.22834, train error 0.335714
	step 11000: train loss 1.17861, train error 0.33
	step 12000: train loss 1.14353, train error 0.304286
	step 13000: train loss 1.09757, train error 0.301429
	step 14000: train loss 0.989379, train error 0.264286
	step 15000: train loss 0.997888, train error 0.278571
	step 16000: train loss 0.947964, train error 0.271429
	step 17000: train loss 0.

In [5]:
# Triplet-hinge experiment: GCNNModelSmall with Triplet_Hinge_Settings. The
# feature stage draws from the triplet samplers, while the classifier stage
# still uses the plain samplers.
test_model(
    feature_model=GCNNModelSmall,
    settings=Triplet_Hinge_Settings,
    num_features=10,
    num_classes=10,
    data=data,
    feature_samplers=triplet_samplers,
    classification_samplers=samplers,
    # feature-network stage
    f_num_steps=50000,
    f_lr=0.01,
    f_keep_prob=0.6,
    f_reg=0.001,
    # linear-classifier stage
    c_num_steps=30000,
    c_lr=0.01,
    c_reg=0.1,
)

begin training features // num_features: 10, lr: 0.01, reg: 0.001, dropout: 0.6
	step 0: train loss 1.5273, train error 0.5
	step 1000: train loss 1.3048, train error 0.344286
	step 2000: train loss 1.19955, train error 0.327143
	step 3000: train loss 1.1406, train error 0.305714
	step 4000: train loss 1.07139, train error 0.291429
	step 5000: train loss 1.07001, train error 0.311429
	step 6000: train loss 0.933511, train error 0.25
	step 7000: train loss 0.943549, train error 0.267143
	step 8000: train loss 0.874594, train error 0.234286
	step 9000: train loss 0.893579, train error 0.252857
	step 10000: train loss 0.80692, train error 0.225714
	step 11000: train loss 0.786572, train error 0.225714
	step 12000: train loss 0.777817, train error 0.217143
	step 13000: train loss 0.74501, train error 0.217143
	step 14000: train loss 0.702917, train error 0.207143
	step 15000: train loss 0.671019, train error 0.185714
	step 16000: train loss 0.702287, train error 0.217143
	step 17000: train