utilDataGenerator.py

#!/usr/bin/python
# -*- coding: utf-8 -*-
from __future__ import print_function
import random
import math
import cv2
import numpy as np
import gc
import utilConst
import utilIO


SHOW_IMAGES = False


# ----------------------------------------------------------------------------
def load_files(array_x_files):
    x_data = []
    y_data = []
    for fname_x in array_x_files:
        fname_y = fname_x.replace(utilConst.X_SUFIX, utilConst.Y_SUFIX)
        img_x = cv2.imread(fname_x, cv2.IMREAD_GRAYSCALE)
        img_y = cv2.imread(fname_y, cv2.IMREAD_GRAYSCALE)
        x_data.append(img_x)
        y_data.append(img_y)

    x_data = np.asarray(x_data).astype('float32')
    x_data = 255. - x_data

    y_data = np.asarray(y_data).astype('float32')   / 255.
    y_data = 1. - y_data

    return x_data, y_data


# ----------------------------------------------------------------------------
# slide a window across the image
def sliding_window(img, stepSize, windowSize):
    #n_steps_y = int( math.ceil( img.shape[0] / float(stepSize) ) )
    #n_steps_x = int( math.ceil( img.shape[1] / float(stepSize) ) )
    n_steps_y = int( math.ceil( (img.shape[0] - windowSize[1] + stepSize) / float(stepSize) ) )
    n_steps_x = int( math.ceil( (img.shape[1] - windowSize[0] + stepSize) / float(stepSize) ) )

    for y in xrange(n_steps_y):
        for x in xrange(n_steps_x):
            posX = x * stepSize
            posY = y * stepSize
            posToX = posX + windowSize[0]
            posToY = posY + windowSize[1]

            if posToX > img.shape[1]:
                posToX = img.shape[1] - 1
                posX = posToX - windowSize[0]

            if posToY > img.shape[0]:
                posToY = img.shape[0] - 1
                posY = posToY - windowSize[1]

            yield (posX, posY, img[posY:posToY, posX:posToX]) # yield the current window


#------------------------------------------------------------------------------
def normalize_data( x_data, norm_type ):
    MEAN = 112.086765946
    STD = 65.5342274216

    x_data = np.asarray(x_data).astype('float32')

    if norm_type == '255':
        x_data /= 255.
    elif norm_type == 'standard':
        mean = np.mean(x_data)
        std = np.std(x_data)
        x_data -= mean
        x_data /= std + 0.00001
    elif norm_type == 'mean':
        mean = np.mean(x_data)
        x_data -= mean
    elif norm_type == 'fstandard':
        x_data -= MEAN
        x_data /= STD + 0.00001
    elif norm_type == 'fmean':
        x_data -= MEAN
    else:
        raise Exception('Norm type not implemented')

    return x_data


# ----------------------------------------------------------------------------
def isSampleSimilarToSource(model_cnn, x_data, num_decimal, threshold_correl_pearson, normalized_list_histogram_source, config):

    roi = x_data.reshape(1, config.window, config.window, 1)

    norm_type = '255'
    roi = normalize_data( roi, norm_type )

    prediction = model_cnn.label_model.predict(roi)
            
    histogram_pred = utilIO.getHistogramBins(prediction, num_decimal)
    list_histogram_pred = histogram_pred.values()
    number_pixels_target = sum(list_histogram_pred)
    normalized_list_histogram_pred = [number / float(number_pixels_target) for number in list_histogram_pred]

    correl_pearson = np.corrcoef(normalized_list_histogram_pred, normalized_list_histogram_source)[0, 1]

    if correl_pearson > threshold_correl_pearson:
        return True
    else:
        return False

# ----------------------------------------------------------------------------
def generate_chunks(
                array_x_files, 
                window_size, 
                step_size, 
                with_filter, 
                histogram_source, 
                model_cnn,
                threshold_correl_pearson,
                num_decimal,
                config):
    x_data = []
    y_data = []

    if with_filter:
        list_histogram_source = histogram_source.values()
        number_pixels_source = sum(list_histogram_source)
        normalized_list_histogram_source = [number / float(number_pixels_source) for number in list_histogram_source]

    total_samples = 0
    total_samples_used = 0
    for fname_x in array_x_files:
        fname_y = fname_x.replace(utilConst.X_SUFIX, utilConst.Y_SUFIX)
        img_x = cv2.imread(fname_x, cv2.IMREAD_GRAYSCALE)
        img_y = cv2.imread(fname_y, cv2.IMREAD_GRAYSCALE)
        assert img_x is not None and img_y is not None
        assert img_x.shape[0] == img_y.shape[0] and img_x.shape[1] == img_y.shape[1]
        assert len(img_x.shape) == 2
        assert len(img_y.shape) == 2

        if SHOW_IMAGES:
            cv2.imshow("img_x", img_x)
            cv2.imshow("Img_y", img_y)
            cv2.waitKey(0)

        if img_x.shape[0] < window_size or img_x.shape[1] < window_size:  # Scale approach
            new_rows = window_size if img_x.shape[0] < window_size else img_x.shape[0]
            new_cols = window_size if img_x.shape[1] < window_size else img_x.shape[1]
            img_x = cv2.resize(img_x, (new_cols, new_rows), interpolation = cv2.INTER_CUBIC)
            img_y = cv2.resize(img_y, (new_cols, new_rows), interpolation = cv2.INTER_CUBIC)

        if SHOW_IMAGES:
            cv2.imshow("img_x", img_x)
            cv2.imshow("Img_y", img_y)
            cv2.waitKey(0)

        coords_x_included = []
        coords_y_included = []
        
        total_samples_img = 0
        total_samples_used_img = 0
        for (x, y, window) in sliding_window(img_x, stepSize=step_size, windowSize=(window_size, window_size)):
            if window.shape[0] != window_size or window.shape[1] != window_size:  # if the window does not meet our desired window size, ignore it
                continue
            
            total_samples_img += 1
            if with_filter:
                is_similar_to_source = isSampleSimilarToSource(model_cnn, window, num_decimal, threshold_correl_pearson, normalized_list_histogram_source, config)
                if is_similar_to_source == False:
                    x_data.append( window.copy() )
                    coords_x_included.append(x)
                    coords_y_included.append(y)
                    total_samples_used_img += 1
            else:
                x_data.append( window.copy() )
                total_samples_used_img += 1
                coords_x_included.append(x)
                coords_y_included.append(y)

            if SHOW_IMAGES:
                cv2.imshow("window_x", window)
                cv2.waitKey(0)
                print(x,y)

        total_samples += total_samples_img
        total_samples_used += total_samples_used_img
        print("Sample extraction in " + str(fname_x))
        print (str(total_samples_used_img) + "/" + str(total_samples_img) + " samples")

        sample_included_found = False
        try:
            last_x_coord = coords_x_included.pop(0)
            last_y_coord = coords_y_included.pop(0)
            for (x, y, window) in sliding_window(img_y, stepSize=step_size, windowSize=(window_size, window_size)):
                if with_filter and sample_included_found == True:
                    if len(coords_x_included) == 0:
                        break
                    last_x_coord = coords_x_included.pop(0)
                    last_y_coord = coords_y_included.pop(0)
                    sample_included_found = False

                if window.shape[0] != window_size or window.shape[1] != window_size:  # if the window does not meet our desired window size, ignore it
                    continue

                if with_filter:
                    if (last_x_coord == x) and (last_y_coord == y):
                        y_data.append( window.copy() )
                        sample_included_found=True
                else:
                    y_data.append( window.copy() )

                if SHOW_IMAGES:
                    cv2.imshow("window_y", window)
                    cv2.waitKey(0)
                    print(x,y)

        except:
            pass

    assert(len(x_data) == len(y_data))

    print ("--------------------------------Summary of sample extraction----------------------------------")
    print (str(total_samples_used) + "/" + str(total_samples) + " samples")
    print ("With filter: " + str(with_filter))

    norm_type = '255'
    x_data = normalize_data( x_data, norm_type )

    #x_data = np.asarray(x_data).astype('float32')
    #x_data = 255. - x_data

    y_data = np.asarray(y_data).astype('float32')   / 255.
    y_data = 1. - y_data
    #y_data = y_data.reshape(y_data.shape[0], y_data.shape[1], y_data.shape[2], 1)

    print('   x_data - min {} mean {} max {}'.format( np.min(x_data), np.mean(x_data), np.max(x_data)))
    print('   y_data - min {} mean {} max {}'.format( np.min(y_data), np.mean(y_data), np.max(y_data)))

    x_data = x_data.reshape(x_data.shape[0], x_data.shape[1], x_data.shape[2], 1)
    y_data = y_data.reshape(y_data.shape[0], y_data.shape[1], y_data.shape[2], 1)

    return x_data, y_data


# ----------------------------------------------------------------------------
class LazyFileLoader:
   def __init__(self, array_x_files, nb_pages):
      self.array_x_files = array_x_files
      self.pos = 0
      if nb_pages <= 0:
          self.page_size = len(array_x_files)
      else:
          self.page_size = len(array_x_files) / nb_pages

   def __len__(self):
       return len(self.array_x_files)

   def __iter__(self):
       return self

   def __next__(self):
       return self.next()

   def truncate_to_size(self, truncate_to):
       self.array_x_files = self.array_x_files[0:truncate_to]

   def set_x_files(self, array_x_files):
       self.array_x_files = array_x_files

   def reset(self):
       self.pos = 0

   def get_pos(self):
       return self.pos

   def set_pos(self, pos):
       self.pos = pos

   def shuffle(self):
       random.shuffle(self.array_x_files)

   def next(self):
       psize = self.page_size
       if self.pos + psize >= len(self.array_x_files):  # last page?
           if self.pos >= len(self.array_x_files):
               raise StopIteration
           else:
               psize = len(self.array_x_files) - self.pos

       print('> Loading page from', self.pos, 'to', self.pos + psize, '...')
       X_data, Y_data = load_files(self.array_x_files[self.pos:self.pos + psize])
       self.pos += self.page_size

       return X_data, Y_data


# ----------------------------------------------------------------------------
class LazyChunkGenerator(LazyFileLoader):
   def __init__(
                self, array_x_files, nb_pages, window_size, step_size, 
                with_filter, 
                histogram_source, 
                model_cnn,
                threshold_correl_pearson,
                num_decimal,
                config):
        LazyFileLoader.__init__(self, array_x_files, nb_pages)
        self.window_size = window_size
        self.step_size = step_size
        self.with_filter = with_filter 
        self.histogram_source = histogram_source
        self.model_cnn = model_cnn
        self.threshold_correl_pearson = threshold_correl_pearson
        self.num_decimal = num_decimal
        self.config = config

   def next(self):
       psize = self.page_size
       if self.pos + psize >= len(self.array_x_files):  # last page?
           if self.pos >= len(self.array_x_files):
               raise StopIteration
           else:
               psize = len(self.array_x_files) - self.pos

       print('> Loading page from', self.pos, 'to', self.pos + psize, '...')
       gc.collect()
       X_data, Y_data = generate_chunks(self.array_x_files[self.pos:self.pos + psize],
                                        self.window_size, self.step_size,
                                        self.with_filter, 
                                        self.histogram_source, 
                                        self.model_cnn,
                                        self.threshold_correl_pearson,
                                        self.num_decimal,
                                        self.config)
       self.pos += self.page_size

       return X_data, Y_data