In [1]:
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import numpy as np
import tensorflow as tf
from tensorflow.contrib import layers
from tensorflow.contrib.layers.python.layers import layers as layers_lib
from tensorflow.python.ops import array_ops

import cv2
import matplotlib.pyplot as plt
from sklearn.cross_validation import train_test_split
import random

import json

# Emit TensorFlow log messages at INFO level and above.
tf.logging.set_verbosity(tf.logging.INFO)

# GPU selection: CUDA_DEVICE_ORDER=PCI_BUS_ID asks CUDA to number devices by
# PCI bus id, and CUDA_VISIBLE_DEVICES="2" exposes only device index 2 to
# this process.
import os
os.environ.update({
    "CUDA_DEVICE_ORDER": "PCI_BUS_ID",
    "CUDA_VISIBLE_DEVICES": "2",
})


  from ._conv import register_converters as _register_converters


In [2]:
# Read the fold-split definition and parse its JSON content.
# The `with` block guarantees the file handle is closed even if reading fails
# (the previous bare open() left the handle open for the kernel's lifetime).
# `data_txt` remains bound afterwards, but as a closed file object.
with open('./data_split/5fold_0802.txt', 'r') as data_txt:
    data_json = data_txt.read()

# Parsed split; indexed below as tr_data_dir['train<k>'] / tr_data_dir['valid<k>'].
tr_data_dir = json.loads(data_json)

In [3]:
# Geometry of the source images: 640x480 pixels, 3 colour channels.
width, height, channel = 640, 480, 3

# Target side lengths used when resizing images for the network.
r_w = r_h = 224

# Number of values in one flattened, resized image.
total_pix = channel * r_h * r_w

In [4]:
# Display the first entry of the 'train0' list as a quick check of the loaded split.
tr_data_dir['train0'][0]

'/dataset_full/Torn/Torn (1220).png'

In [5]:
def vgg16(features, labels, mode):
    """Estimator `model_fn` building a VGG-16 style two-class classifier.

    Args:
        features: dict whose "x" entry holds the image batch; it is reshaped
            to [-1, 224, 224, 3] before entering the network.
        labels: integer class ids, consumed by sparse softmax cross-entropy
            and the accuracy metric (not used in PREDICT mode).
        mode: one of `tf.estimator.ModeKeys` (TRAIN, EVAL or PREDICT).

    Returns:
        A `tf.estimator.EstimatorSpec` for the requested mode:
        predictions only (PREDICT), loss + train_op (TRAIN), or
        loss + accuracy metric (EVAL).
    """
    # Input Layer
    # Reshape X to 4-D tensor: [batch_size, height, width, channels].
    # Images are expected already resized to 224x224 with 3 channels; the
    # 7x7 VALID convolution in 'fc6' relies on that spatial size.
    input_layer = tf.reshape(features["x"], [-1, 224, 224, 3])
    dropout_keep_prob = 0.5
    num_classes = 2
    # Dropout must only be active while training. Hard-coding True kept it
    # enabled in EVAL and PREDICT, randomly dropping half of the fc6/fc7
    # activations for every evaluation metric and every prediction.
    is_training = (mode == tf.estimator.ModeKeys.TRAIN)

    # Five convolutional stages, each followed by 2x2 max pooling.
    net = layers_lib.repeat(
        input_layer, 2, layers.conv2d, 64, [3, 3], scope='conv1')
    net = layers_lib.max_pool2d(net, [2, 2], scope='pool1')
    net = layers_lib.repeat(net, 2, layers.conv2d, 128, [3, 3], scope='conv2')
    net = layers_lib.max_pool2d(net, [2, 2], scope='pool2')
    net = layers_lib.repeat(net, 3, layers.conv2d, 256, [3, 3], scope='conv3')
    net = layers_lib.max_pool2d(net, [2, 2], scope='pool3')
    net = layers_lib.repeat(net, 3, layers.conv2d, 512, [3, 3], scope='conv4')
    net = layers_lib.max_pool2d(net, [2, 2], scope='pool4')
    net = layers_lib.repeat(net, 3, layers.conv2d, 512, [3, 3], scope='conv5')
    net = layers_lib.max_pool2d(net, [2, 2], scope='pool5')
    # Use conv2d instead of fully_connected layers.
    net = layers.conv2d(net, 4096, [7, 7], padding='VALID', scope='fc6')
    net = layers_lib.dropout(
        net, dropout_keep_prob, is_training=is_training, scope='dropout6')
    net = layers.conv2d(net, 4096, [1, 1], scope='fc7')
    net = layers_lib.dropout(
        net, dropout_keep_prob, is_training=is_training, scope='dropout7')
    net = layers.conv2d(
        net,
        num_classes, [1, 1],
        activation_fn=None,
        normalizer_fn=None,
        scope='fc8')
    # Drop the two singleton spatial axes so logits are [batch, num_classes].
    net = array_ops.squeeze(net, [1, 2], name='fc8/squeezed')

    logits = net

    predictions = {
        # Generate predictions (for PREDICT and EVAL mode)
        "classes": tf.argmax(input=logits, axis=1),
        # Add `softmax_tensor` to the graph. It is used for PREDICT and can
        # be referenced by name from a `LoggingTensorHook`.
        "probabilities": tf.nn.softmax(logits, name="softmax_tensor")
    }
    if mode == tf.estimator.ModeKeys.PREDICT:
        return tf.estimator.EstimatorSpec(mode=mode, predictions=predictions)

    # Calculate Loss (for both TRAIN and EVAL modes).
    # sparse_softmax_cross_entropy takes integer class ids, not one-hot labels.
    loss = tf.losses.sparse_softmax_cross_entropy(labels=labels, logits=logits)
    # (value_op, update_op) pair; the update op is what gets summarised.
    acc = tf.metrics.accuracy(labels=labels, predictions=predictions["classes"])

    tf.summary.scalar('train_acc', acc[1])

    # Configure the Training Op (for TRAIN mode)
    if mode == tf.estimator.ModeKeys.TRAIN:
        optimizer = tf.train.AdamOptimizer(learning_rate=0.0001)
        train_op = optimizer.minimize(
            loss=loss,
            global_step=tf.train.get_global_step())
        return tf.estimator.EstimatorSpec(mode=mode, loss=loss, train_op=train_op)

    # Add evaluation metrics (for EVAL mode). Reuse the metric built above
    # instead of creating a second, identical accuracy op in the graph.
    eval_metric_ops = {"accuracy": acc}
    return tf.estimator.EstimatorSpec(
        mode=mode, loss=loss, eval_metric_ops=eval_metric_ops)

In [6]:
#config = tf.ConfigProto()
#config.gpu_options.per_process_gpu_memory_fraction = 0.9
#session = tf.Session(config=config)

# Fold index: selects the 'train%d' / 'valid%d' lists and the model directory.
k = 2
total_res = {}
# Prefix prepended to every path stored in the split file.
add_dir = '/hdd3/dhj_container/DB'


val_result = []

# Checkpoints and summaries for this fold are written here.
f_dir = "/hdd3/dhj_container/ICROS_vgg/kfold0811_%d/" % k

if not tf.gfile.Exists(f_dir):
    tf.gfile.MakeDirs(f_dir)

net_classifier = tf.estimator.Estimator(
    model_fn=vgg16, model_dir=f_dir)

# Set up logging for predictions
# Log the values in the "Softmax" tensor with label "probabilities"
# NOTE(review): this hook is created but never passed to TrainSpec/EvalSpec
# in this cell, so it has no effect here -- confirm whether that is intended.
tensors_to_log = {"probabilities": "softmax_tensor"}
logging_hook = tf.train.LoggingTensorHook(
    tensors=tensors_to_log, every_n_iter=50)


def _load_split(rel_paths, root_dir, size, n_features):
    """Load, resize and flatten the images of one split and derive labels.

    Args:
        rel_paths: sequence of path strings; each is appended to `root_dir`.
        root_dir: string prefix prepended to every entry of `rel_paths`.
        size: (width, height) tuple handed to `cv2.resize`.
        n_features: length of one flattened, resized image.

    Returns:
        (data, labels): `data` is float32 of shape (len(rel_paths), n_features);
        `labels` is int32 of shape (len(rel_paths), 1), holding 0 when the
        path contains 'Untorn' or 'normal' and 1 otherwise.

    Raises:
        IOError: if `cv2.imread` cannot read an image. It returns None in
            that case, which would otherwise surface as an opaque error
            inside `cv2.resize`.
    """
    data = np.zeros((len(rel_paths), n_features), dtype=np.float32)
    labels = np.zeros((len(rel_paths), 1), dtype=np.int32)

    for idx, rel_path in enumerate(rel_paths):
        full_path = root_dir + rel_path
        img = cv2.imread(full_path)
        if img is None:
            raise IOError("Could not read image: %s" % full_path)
        resized = cv2.resize(img, size, interpolation=cv2.INTER_CUBIC)
        data[idx, :] = resized.flatten()

        # 'Untorn' has to be tested explicitly: such paths would otherwise
        # fall into the default (label 1) branch.
        if 'Untorn' in rel_path or 'normal' in rel_path:
            labels[idx] = 0
        else:
            labels[idx] = 1

    return data, labels


tr_data, tr_label = _load_split(
    tr_data_dir['train%d' % k], add_dir, (r_w, r_h), total_pix)
val_data, val_label = _load_split(
    tr_data_dir['valid%d' % k], add_dir, (r_w, r_h), total_pix)


batch_s = 32
epochs = 30
# Total optimisation steps for `epochs` passes over the training set.
tr_steps = int(tr_data.shape[0]/batch_s*epochs)
step_in_epoch = int(tr_data.shape[0]/batch_s)+1
in_steps = 1


# NOTE(review): shuffle=False feeds the training samples in the same order
# every epoch -- confirm this is intended (e.g. the split file is already
# shuffled) before relying on it.
train_input_fn = tf.estimator.inputs.numpy_input_fn(
    x={"x": tr_data},
    y=tr_label,
    batch_size=batch_s,
    num_epochs=epochs,
    shuffle=False)

eval_input_fn = tf.estimator.inputs.numpy_input_fn(
    x={"x": val_data},
    y=val_label,
    batch_size=64,
    num_epochs=1,
    shuffle=False)

train_spec = tf.estimator.TrainSpec(input_fn=train_input_fn, max_steps=tr_steps)
# steps=None: evaluate until the validation input is exhausted.
eval_spec = tf.estimator.EvalSpec(input_fn=eval_input_fn, steps=None, throttle_secs=100)

tf.estimator.train_and_evaluate(net_classifier, train_spec, eval_spec)

INFO:tensorflow:Using default config.
INFO:tensorflow:Using config: {'_global_id_in_cluster': 0, '_is_chief': True, '_num_ps_replicas': 0, '_task_type': 'worker', '_master': '', '_save_summary_steps': 100, '_save_checkpoints_steps': None, '_save_checkpoints_secs': 600, '_session_config': None, '_keep_checkpoint_every_n_hours': 10000, '_model_dir': '/hdd3/dhj_container/ICROS_vgg/kfold0811_2/', '_log_step_count_steps': 100, '_keep_checkpoint_max': 5, '_evaluation_master': '', '_tf_random_seed': None, '_num_worker_replicas': 1, '_service': None, '_task_id': 0, '_cluster_spec': <tensorflow.python.training.server_lib.ClusterSpec object at 0x7f6c6a51e128>}
INFO:tensorflow:Running training and evaluation locally (non-distributed).
INFO:tensorflow:Start train and evaluate loop. The evaluate will happen after 100 secs (eval_spec.throttle_secs) or training is finished.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensor

KeyboardInterrupt: 