# Snapshot Serengeti Inception-V3

## Disclaimer
This notebook uses the pre-built, open-source Inception v3 model as a baseline.
For more information see https://www.tensorflow.org/tutorials/image_recognition#usage_with_python_api.
The original source code, which this notebook modifies, is available at https://github.com/tensorflow/models

## Setup

In [1]:
# Basic Data Imports
import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt

# Google Inception Imports
from six.moves import urllib
import os
import sys
import tarfile
import re

In [2]:
# Root of the code base. The default assumes a vagrant box; when running
# anywhere else, point this at your own project root,
# for example ~/home/projects/code-base
CODEBASE_DIR = '/vagrant'

# Project directories
DATA_DIR = '{}/data'.format(CODEBASE_DIR)
MODEL_DIR = '{}/models'.format(CODEBASE_DIR)

# Inception v3 archive URL, unpack directory and number of results to report
DATA_URL = 'http://download.tensorflow.org/models/image/imagenet/inception-2015-12-05.tgz'
DEST_DIRECTORY = '{}/inceptionv3'.format(MODEL_DIR)
NUM_TOP_PREDICTIONS = 5

# Module-wide flag recording whether the Inception graph was already loaded
GRAPH_STARTED = False

# Fixed seed so numpy's random draws are repeatable
np.random.seed(1)

In [3]:
class NodeLookup(object):
  """Converts integer node IDs to human-readable labels.

  The mapping is built once, at construction time, from two lookup files and
  stored in `self.node_lookup` (dict from integer node ID to label string).
  """

  def __init__(self,
               label_lookup_path=None,
               uid_lookup_path=None):
    """Builds the node ID lookup table.

    Args:
      label_lookup_path: path of the file mapping string UID to integer node
        ID. Falls back to the label map file inside DEST_DIRECTORY.
      uid_lookup_path: path of the file mapping string UID to human-readable
        string. Falls back to the synset file inside DEST_DIRECTORY.
    """
    if not label_lookup_path:
      label_lookup_path = os.path.join(
          DEST_DIRECTORY, 'imagenet_2012_challenge_label_map_proto.pbtxt')
    if not uid_lookup_path:
      uid_lookup_path = os.path.join(
          DEST_DIRECTORY, 'imagenet_synset_to_human_label_map.txt')
    self.node_lookup = self.load(label_lookup_path, uid_lookup_path)

  def load(self, label_lookup_path, uid_lookup_path):
    """Loads a human readable English name for each softmax node.

    Args:
      label_lookup_path: string UID to integer node ID.
      uid_lookup_path: string UID to human-readable string.

    Returns:
      dict from integer node ID to human-readable string.
    """
    # NOTE(review): whether tf.logging.fatal stops execution depends on the
    # TensorFlow version in use - confirm. If it only logs, the reads below
    # are what actually fail for a missing file.
    if not tf.gfile.Exists(uid_lookup_path):
      tf.logging.fatal('File does not exist %s', uid_lookup_path)
    if not tf.gfile.Exists(label_lookup_path):
      tf.logging.fatal('File does not exist %s', label_lookup_path)

    # Loads mapping from string UID to human-readable string.
    # The file is read inside a `with` block so the handle is closed promptly.
    with tf.gfile.GFile(uid_lookup_path) as uid_file:
      proto_as_ascii_lines = uid_file.readlines()
    uid_to_human = {}
    # For each line, findall() is expected to yield the UID at index 0 and the
    # label at index 2 (presumably lines look like `n01440764<TAB>tench`, with
    # index 1 being an empty match at the separator - confirm against the file).
    p = re.compile(r'[n\d]*[ \S,]*')
    for line in proto_as_ascii_lines:
      parsed_items = p.findall(line)
      uid = parsed_items[0]
      human_string = parsed_items[2]
      uid_to_human[uid] = human_string

    # Loads mapping from string UID to integer node ID.
    node_id_to_uid = {}
    with tf.gfile.GFile(label_lookup_path) as label_file:
      proto_as_ascii = label_file.readlines()
    for line in proto_as_ascii:
      if line.startswith('  target_class:'):
        target_class = int(line.split(': ')[1])
      if line.startswith('  target_class_string:'):
        target_class_string = line.split(': ')[1]
        # Drop the first character and the last two (presumably the
        # surrounding quotes and the trailing newline).
        node_id_to_uid[target_class] = target_class_string[1:-2]

    # Loads the final mapping of integer node ID to human-readable string
    node_id_to_name = {}
    for key, val in node_id_to_uid.items():
      if val not in uid_to_human:
        tf.logging.fatal('Failed to locate: %s', val)
      name = uid_to_human[val]
      node_id_to_name[key] = name

    return node_id_to_name

  def id_to_string(self, node_id):
    """Returns the label for `node_id`, or '' when the ID is unknown."""
    return self.node_lookup.get(node_id, '')

In [4]:
# Download Google Inception v3 Model
# Based on https://www.tensorflow.org/tutorials/image_recognition#usage_with_python_api

def maybe_download_and_extract():
  """Download the model tar file if needed and extract it.

  Creates DEST_DIRECTORY when it is missing, downloads DATA_URL into it unless
  a file with the archive's name is already there, and then extracts the
  archive into DEST_DIRECTORY. Extraction runs on every call, including when
  the download is skipped.
  """
  if not os.path.exists(DEST_DIRECTORY):
    os.makedirs(DEST_DIRECTORY)
  filename = DATA_URL.split('/')[-1]
  filepath = os.path.join(DEST_DIRECTORY, filename)
  if not os.path.exists(filepath):
    def _progress(count, block_size, total_size):
      # Rewrites a single console line with the download percentage.
      sys.stdout.write('\r>> Downloading %s %.1f%%' % (
          filename, float(count * block_size) / float(total_size) * 100.0))
      sys.stdout.flush()
    filepath, _ = urllib.request.urlretrieve(DATA_URL, filepath, _progress)
    print()
    statinfo = os.stat(filepath)
    print('Successfully downloaded', filename, statinfo.st_size, 'bytes.')
  # NOTE(security): extractall() trusts the member paths stored in the
  # archive, and DATA_URL is fetched over plain HTTP. Review before pointing
  # DATA_URL at a source you do not control.
  # The `with` block closes the archive handle once extraction finishes.
  with tarfile.open(filepath, 'r:gz') as archive:
    archive.extractall(DEST_DIRECTORY)


In [5]:
def create_graph():
  """Imports the saved Inception GraphDef file into the default graph.

  The import happens at most once per session of this notebook: the
  module-level GRAPH_STARTED flag is set after a successful import and later
  calls return immediately. The flag is only set once the import succeeded,
  so a failed attempt can be retried.

  Returns:
    None.
  """
  global GRAPH_STARTED
  if GRAPH_STARTED:
    return

  # Creates graph from saved graph_def.pb.
  graph_path = os.path.join(DEST_DIRECTORY, 'classify_image_graph_def.pb')
  with tf.gfile.FastGFile(graph_path, 'rb') as f:
    graph_def = tf.GraphDef()
    graph_def.ParseFromString(f.read())
  tf.import_graph_def(graph_def, name='')

  GRAPH_STARTED = True

In [6]:
def run_inference_on_image(image):
  """Runs inference on an image.

  Args:
    image: Image file name.

  Returns:
    A list of up to NUM_TOP_PREDICTIONS tuples
    (human_string, node_id, score), ordered from the highest score to the
    lowest.
  """
  if not tf.gfile.Exists(image):
    tf.logging.fatal('File does not exist %s', image)
  # Read inside a `with` block so the file handle is closed promptly.
  with tf.gfile.FastGFile(image, 'rb') as image_file:
    image_data = image_file.read()

  # Creates graph from saved GraphDef.
  create_graph()

  with tf.Session() as sess:
    # Some useful tensors:
    # 'softmax:0': A tensor containing the normalized prediction across
    #   1000 labels.
    # 'pool_3:0': A tensor containing the next-to-last layer containing 2048
    #   float description of the image.
    # 'DecodeJpeg/contents:0': A tensor containing a string providing JPEG
    #   encoding of the image.
    # Runs the softmax tensor by feeding the image_data as input to the graph.
    softmax_tensor = sess.graph.get_tensor_by_name('softmax:0')
    predictions = sess.run(softmax_tensor,
                           {'DecodeJpeg/contents:0': image_data})
    predictions = np.squeeze(predictions)

  # Creates node ID --> English string lookup.
  node_lookup = NodeLookup()

  # argsort is ascending, so take the tail and reverse it to get the best
  # scores first.
  top_k = predictions.argsort()[-NUM_TOP_PREDICTIONS:][::-1]
  return [(node_lookup.id_to_string(node_id), node_id, predictions[node_id])
          for node_id in top_k]

## Analysis

In [7]:
# Run classification on snapshot data
maybe_download_and_extract()
elephant_dir = DATA_DIR + '/snapshot/Elephant'
# os.listdir returns entries in arbitrary order; sort them so the seeded
# random sample below refers to the same files on every run and machine.
img_elephants = [os.path.join(elephant_dir, img)
                 for img in sorted(os.listdir(elephant_dir))]

# Five random indices into img_elephants (drawn independently, so an index
# may repeat).
imgs = np.random.randint(0, len(img_elephants), 5)

>> Downloading inception-2015-12-05.tgz 100.0%
Successfully downloaded inception-2015-12-05.tgz 88931400 bytes.


### Random image exploration

In [8]:
# Display the first randomly selected elephant image.
# NOTE(review): `Image` is not imported in any visible cell, so this call
# raises NameError; presumably IPython.display.Image was intended - confirm.
Image(img_elephants[imgs[0]])

NameError: name 'Image' is not defined

In [None]:
# Classify the randomly selected image imgs[0] (the one the preceding cell
# displays) rather than simply the first file in the list.
run_inference_on_image(img_elephants[imgs[0]])

In [None]:
# Display the second randomly selected elephant image.
# NOTE(review): `Image` is not imported in any visible cell, so this call
# raises NameError; presumably IPython.display.Image was intended - confirm.
Image(img_elephants[imgs[1]])

In [None]:
# Classify the randomly selected image imgs[1] (the one the preceding cell
# displays) rather than simply the second file in the list.
run_inference_on_image(img_elephants[imgs[1]])

In [None]:
# Display the third randomly selected elephant image.
# NOTE(review): `Image` is not imported in any visible cell, so this call
# raises NameError; presumably IPython.display.Image was intended - confirm.
Image(img_elephants[imgs[2]])

In [None]:
# Classify the randomly selected image imgs[2] (the one the preceding cell
# displays) rather than simply the third file in the list.
run_inference_on_image(img_elephants[imgs[2]])

In [None]:
# Display the fourth randomly selected elephant image.
# NOTE(review): `Image` is not imported in any visible cell, so this call
# raises NameError; presumably IPython.display.Image was intended - confirm.
Image(img_elephants[imgs[3]])

In [None]:
# Classify the randomly selected image imgs[3] (the one the preceding cell
# displays) rather than simply the fourth file in the list.
run_inference_on_image(img_elephants[imgs[3]])

In [None]:
# Display the fifth randomly selected elephant image.
# NOTE(review): `Image` is not imported in any visible cell, so this call
# raises NameError; presumably IPython.display.Image was intended - confirm.
Image(img_elephants[imgs[4]])

In [None]:
# Classify the randomly selected image imgs[4] (the one the preceding cell
# displays) rather than simply the fifth file in the list.
run_inference_on_image(img_elephants[imgs[4]])

In [None]:
### TODO: Score everything, track distribution of scorings
### Manually look at ImageNet and pick node_ids that represent elephants
### Create manual classification based on these

### Use non-elephants as negative examples, see how it performs overall