In [1]:
import numpy as np
import matplotlib.pyplot as plt
import os, time
from skimage import io
from skimage.feature import hog
from sklearn import svm
from sklearn import linear_model
from sklearn import metrics
from sklearn import calibration
import pickle
import copy
import csv

In [2]:
# Notebook-wide matplotlib defaults: figure size and base font size.
plt.rcParams.update({'figure.figsize': (15, 15), 'font.size': 12})

In [3]:
# File handle of the per-run results text file: run_hogsvm() opens and closes it,
# log_result() writes to it. None while no results file is open.
RESULTS_FH = None # global

In [4]:
# Dataset root; get_dataset_fp() reads its 'train' and 'test' sub-directories.
DIR = 'Individual_Component'
# Seed given to np.random.seed() before the feature rows are shuffled in images_to_hog().
SEED = 42

# [HOG parameters]
# img (w,h): (64,80)
# NFEATURES = nblocks * norientations/cell * ncells/block
# Passed to skimage's hog() as `transform_sqrt` (see run_hog()).
POWER_LAW_COMPRESSION = True

# Parameter grid: the sweep cell runs one train/test cycle per combination of these lists.
# Each block size / cell size is used for both axes, i.e. (n, n).
BLOCK_SIZE_LIST = [1, 2, 3, 4]
BLOCK_NORM_LIST = ['L2-Hys'] # available: ['L1', 'L1-sqrt', 'L2', 'L2-Hys']
CELL_PIXEL_LIST = [4, 5, 6, 7, 8, 9, 10, 14]
ORIENTATION_LIST = [13]#[6, 7, 8, 9, 10, 11, 12]
# Upper bounds on the number of positive / negative training images read by load_images().
NPOS_TRAINING_IMGS = 3000
NNEG_TRAINING_IMGS = 3000

## (Test platform test runs)

# BLOCK_SIZE_LIST = [1]
# BLOCK_NORM_LIST = ['L1']
# CELL_PIXEL_LIST = [4]
# ORIENTATION_LIST = [8, 6]
# NPOS_TRAINING_IMGS = 10
# NNEG_TRAINING_IMGS = 10

# BLOCK_SIZE_LIST = [1,2,4]
# BLOCK_NORM_LIST = ['L2-Hys'] # available: ['L1', 'L1-sqrt', 'L2', 'L2-Hys']
# CELL_PIXEL_LIST = [5, 6, 7, 8, 9, 10, 14]
# ORIENTATION_LIST = [7,11]
# NPOS_TRAINING_IMGS = 3000
# NNEG_TRAINING_IMGS = 3000

In [5]:
# Close a results file left open by an earlier (possibly interrupted) run.
if RESULTS_FH is not None:
    RESULTS_FH.close()
    RESULTS_FH = None  # forget the closed handle so nothing tries to write to it
print('Results file closed.')

Results file closed.


In [6]:
def list_mul(l, num):
    """Multiply every element of ``l`` by ``num``, truncate each product with ``int()``, and return the results as a tuple."""
    return tuple(int(num * element) for element in l)

# Histogram of Oriented Gradients
def run_hog(img, visualize=False):
    """Compute the HOG descriptor of ``img`` with the current sweep parameters.

    The HOG settings are read from the module-level variables NORIENTATIONS,
    CELL_PIXELSHAPE, CELLS_PER_BLOCK, BLOCK_NORM and POWER_LAW_COMPRESSION,
    which the parameter-sweep cell sets before each run.

    Args:
        img: image passed straight to skimage's ``hog``.
        visualize: forwarded to ``hog``.

    Returns:
        Whatever ``hog`` returns for the given ``visualize`` setting.
    """
    # NOTE(review): newer scikit-image releases replaced `multichannel` with
    # `channel_axis` — confirm against the installed version before upgrading.
    hog_kwargs = dict(
        orientations=NORIENTATIONS,
        pixels_per_cell=CELL_PIXELSHAPE,
        cells_per_block=CELLS_PER_BLOCK,
        block_norm=BLOCK_NORM,
        visualize=visualize,
        transform_sqrt=POWER_LAW_COMPRESSION,
        multichannel=True,
    )
    return hog(img, **hog_kwargs)

In [7]:
# Reference: https://www.kaggle.com/manikg/training-svm-classifier-with-hog-features

def log_result(s, on_console=True): # debug log...
    """Write ``s`` to the open results file and, optionally, to the console.

    Args:
        s: message to log.
        on_console: when True the message is also printed to stdout.

    When no results file is open (RESULTS_FH is None) the file write is
    skipped. ``print(..., file=None)`` would otherwise fall back to stdout,
    printing the message a second time and ignoring ``on_console=False``.
    """
    global RESULTS_FH
    if on_console:
        print(s)
    if RESULTS_FH is not None:
        print(s, file=RESULTS_FH)

# Code to load the dataset
def get_dataset_fp(is_train):
    """Collect the image directories of the training or testing split.

    Looks in ``DIR/train`` (``is_train`` truthy) or ``DIR/test``. Every
    first-level directory whose name contains 'positive' or 'negative'
    contributes its immediate sub-directories to the matching list; other
    entries and plain files are ignored.

    Args:
        is_train: selects the 'train' split when truthy, otherwise 'test'.

    Returns:
        (pos_dirs, neg_dirs): two lists of directory paths.
    """
    subroot = 'train' if is_train else 'test'
    base_fp = os.path.join(DIR, subroot)
    pos_dirs = []
    neg_dirs = []
    # os.listdir() returns entries in arbitrary order; sort so that the images
    # picked under the NPOS/NNEG caps are the same on every machine and run.
    for dir_name in sorted(os.listdir(base_fp)): # all files & dirs
        subfp = os.path.join(base_fp, dir_name)
        if not os.path.isdir(subfp):
            continue
        # the class depends only on the first-level name, so decide it once
        if 'positive' in dir_name:
            target = pos_dirs
        elif 'negative' in dir_name:
            target = neg_dirs
        else:
            continue
        for subdir_name in sorted(os.listdir(subfp)):
            subsubfp = os.path.join(subfp, subdir_name)
            if os.path.isdir(subsubfp):
                target.append(subsubfp)
    return pos_dirs, neg_dirs

def get_subset_images(fp, nimgs=None, preproc=False):
    """Load the '.pnm' images found directly inside directory ``fp``.

    Args:
        fp: directory to scan (sub-directories are skipped, not descended into).
        nimgs: maximum number of images to load; None loads all of them and
            a value <= 0 loads none.
        preproc: when True each image is converted with run_hog() and the
            descriptor is stored instead of the raw image.

    Returns:
        (results, results_fp): the loaded images (or HOG descriptors) and the
        file path of each, in the same order.
    """
    results = []
    results_fp = []
    # A non-positive cap means "nothing requested"; without this guard one
    # image would still be loaded before the cap was checked.
    if nimgs is not None and nimgs <= 0:
        return results, results_fp
    # Sorted for a reproducible selection: os.listdir() order is arbitrary.
    for img_fn in sorted(os.listdir(fp)):
        img_fp = os.path.join(fp, img_fn)
        if os.path.isdir(img_fp) or not img_fn.lower().endswith('.pnm'):
            continue
        img = io.imread(img_fp)
        results.append(run_hog(img) if preproc else img)
        results_fp.append(img_fp)
        # restrict num imgs loaded
        if nimgs is not None and len(results) >= nimgs:
            break
    return results, results_fp

# Class labels stored in y_train / y_test. IS_PERSON is also used in run_test()
# as the column index into predict_proba()'s output.
NO_PERSON = 0
IS_PERSON = 1

#def load_images(is_train, shuffle, npos_imgs=None, nneg_imgs=None, save_fn=None):
def _load_from_dirs(dirs, max_imgs):
    """Load raw images from ``dirs`` in order, stopping once ``max_imgs`` images are loaded (None = no cap)."""
    images = []
    paths = []
    remaining = max_imgs
    for fp in dirs:
        start_time = time.time()
        cur_subset, cur_subset_fp = get_subset_images(fp, remaining, False)
        images += cur_subset
        paths += cur_subset_fp
        log_result('  * {:.3f}s runtime (images loaded): {}'.format(time.time() - start_time,fp))
        if remaining is not None:
            # only the still-missing number of images is requested from the next directory
            remaining -= len(cur_subset)
            if remaining <= 0:
                break
    return images, paths


def load_images(is_train, npos_imgs=None, nneg_imgs=None):
    """Load the unprocessed images of one dataset split with their labels.

    Positive directories are read first, then negative ones, so the returned
    lists hold all positives followed by all negatives.

    Args:
        is_train: forwarded to get_dataset_fp() to pick the split.
        npos_imgs: cap on the number of positive images (None = no cap).
        nneg_imgs: cap on the number of negative images (None = no cap).

    Returns:
        (x_train, y_train, fp_train): images, labels (IS_PERSON / NO_PERSON)
        and source file paths, all in the same order.
    """
    pos_dirs, neg_dirs = get_dataset_fp(is_train=is_train)
    pos_imgs, pos_fps = _load_from_dirs(pos_dirs, npos_imgs)
    neg_imgs, neg_fps = _load_from_dirs(neg_dirs, nneg_imgs)

    x_train = pos_imgs + neg_imgs
    y_train = [IS_PERSON] * len(pos_imgs) + [NO_PERSON] * len(neg_imgs)
    fp_train = pos_fps + neg_fps
    return x_train, y_train, fp_train

def images_to_hog(x_train, y_train, fp_train, shuffle, save_fn=None):
    """Convert raw images to HOG feature rows, optionally shuffle, optionally cache.

    Args:
        x_train: sequence of images; each is passed to run_hog(). The sequence
            itself is left unmodified.
        y_train: label per image.
        fp_train: source file path per image.
        shuffle: when True, rows are shuffled with np.random seeded by SEED.
        save_fn: if given, the returned tuple is pickled to this path.

    Returns:
        (x, y, fp_index, fp_train): feature matrix, labels, and for every row
        the index into ``fp_train`` of the image it came from. After shuffling,
        labels and indices are floats because they travel through the same
        array as the features; callers cast the indices back with int().

    Raises:
        ValueError: if ``x_train`` is empty.
    """
    if len(x_train) == 0:
        raise ValueError('images_to_hog(): no images to convert '
                         '(check the dataset directories and the .pnm filter)')

    # convert each img to hog (intermed step added to cache original unproc'd images)
    start_time = time.time()
    # Build a new list rather than overwriting x_train[i], so the caller's
    # raw-image list survives the call.
    hog_features = [run_hog(img) for img in x_train]
    hog_shape = hog_features[0].shape
    log_result('  * {:.3f}s runtime (conversion to HOG)'.format(time.time() - start_time))

    x_train = np.array(hog_features)
    y_train = np.array(y_train)
    fp_train_index = np.arange(len(fp_train)) # create unique IDs (from 0)

    if shuffle:
        # Glue features, label and path index into one array so a single
        # row shuffle keeps them aligned.
        y_train = y_train.reshape(len(y_train),1)
        fp_train_index = fp_train_index.reshape(len(fp_train_index),1)
        data_frame = np.hstack((x_train,y_train, fp_train_index))

        start_time = time.time()
        np.random.seed(SEED) # note: reseeds numpy's global RNG
        np.random.shuffle(data_frame)
        x_train = data_frame[:,:-2]
        y_train = data_frame[:,-2].ravel()
        fp_train_index = data_frame[:,-1].ravel()
        log_result('  * {:.3f}s runtime (shuffling)'.format(time.time() - start_time))

    log_result('HOG descriptor size: ' + str(hog_shape))
    result = (x_train, y_train, fp_train_index, fp_train)
    # save loaded images
    if save_fn is not None:
        with open(save_fn, 'wb') as fh:
            pickle.dump(result, fh)
    return result
    
# Code to generate the SVM model
def gen_model(model_fn, x_train, y_train):
    """Train the classifier on HOG features and pickle it to ``model_fn``.

    The classifier is a hinge-loss LinearSVC wrapped in
    CalibratedClassifierCV (cv=5); run_test() calls predict_proba() on it.

    Args:
        model_fn: path the fitted classifier is pickled to.
        x_train: training feature matrix.
        y_train: training labels.

    Returns:
        The fitted classifier.
    """
    start_time = time.time()
    # alternatives tried earlier:
    #clf = svm.SVC(probability=True)
    #clf = linear_model.SGDClassifier()
    # NOTE(review): newer scikit-learn releases renamed `base_estimator` to
    # `estimator` — confirm against the installed version before upgrading.
    clf = calibration.CalibratedClassifierCV(base_estimator = svm.LinearSVC(loss='hinge'), cv=5)
    clf.fit(x_train, y_train)
    # The label used to say "SGD training", a leftover from the SGDClassifier
    # experiment; the model trained here is the calibrated LinearSVC.
    log_result('{:.3f}s runtime (calibrated LinearSVC training)'.format(time.time() - start_time))

    # save SVM model
    with open(model_fn, 'wb') as fh:
        pickle.dump(clf, fh)
    return clf

In [8]:
# Computes statistics for the classifier's performance
def run_test(clf, x_test, y_test):
    """Predict on ``x_test`` and log/return the classifier's performance.

    Args:
        clf: fitted classifier exposing predict() and predict_proba().
        x_test: feature matrix to classify.
        y_test: true labels for ``x_test``.

    Returns:
        (y_pred, y_prob, stats) where ``stats`` maps 'Prediction Time', 'AUC',
        'Accuracy', 'Precision', 'Recall' and 'Confusion Matrix' to their values.
    """
    # Only the two prediction calls are timed.
    started = time.time()
    y_pred = clf.predict(x_test)
    y_prob = clf.predict_proba(x_test)
    elapsed_time = time.time() - started

    # y_prob: https://scikit-learn.org/stable/modules/generated/sklearn.svm.SVC.html
    #  - shape: (nsamples, nclasses), by order of `clf.classes_`
    person_scores = y_prob[:,IS_PERSON]
    auc = metrics.roc_auc_score(y_test, person_scores, average='weighted')
    accuracy = metrics.accuracy_score(y_test, y_pred)
    precision = metrics.precision_score(y_test, y_pred, average='weighted')
    recall = metrics.recall_score(y_test, y_pred, average='weighted')
    confusion_matrix = metrics.confusion_matrix(y_test, y_pred)

    stats = {
        'Prediction Time': elapsed_time,
        'AUC': auc,
        'Accuracy': accuracy,
        'Precision': precision,
        'Recall': recall,
        'Confusion Matrix': confusion_matrix,
    }

    per_image = elapsed_time/len(y_test)
    log_result('  * {:.6f}s prediction time ({:.6f} s/image)'.format(elapsed_time, per_image))
    for template, value in (
        ('  * AUC (weighted): {:.9f}', auc),
        ('  * Accuracy: {:.9f}', accuracy),
        ('  * Precision (weighted): {:.9f}', precision),
        ('  * Recall (weighted): {:.9f}', recall),
    ):
        log_result(template.format(value))
    log_result('  * Confusion Matrix:')
    log_result(str(confusion_matrix))
    return y_pred, y_prob, stats

# Returns all image file paths detected falsely
def filter_failed_fp(y_pred, y_test, fp_test_index, fp_test):
    """List the misclassified samples with their source file paths.

    Args:
        y_pred: predicted labels.
        y_test: true labels, aligned with ``y_pred``.
        fp_test_index: per-sample index into ``fp_test`` (cast with int()).
        fp_test: file paths of the source images.

    Returns:
        A list of (label, file_path) tuples, where label is 'FN' when the
        prediction was NO_PERSON and 'FP' otherwise.
    """
    failed_fp = []
    for i, predicted in enumerate(y_pred):
        if predicted != y_test[i]:
            label = 'FN' if predicted == NO_PERSON else 'FP'
            source = fp_test[int(fp_test_index[i])]
            failed_fp.append((label, source))
    return failed_fp

In [9]:
# 1. Generate SVM model (and training images) or load cached result
def get_svm_model(cur_dir_contents, SVM_MODEL, PRE_TRAINING_IMGS):
    """Return the training data and classifier, from disk cache if available.

    Args:
        cur_dir_contents: names of the files present in the working directory.
        SVM_MODEL: file name of the pickled classifier.
        PRE_TRAINING_IMGS: file name of the pickled training features.

    Returns:
        (x_train, y_train, fp_train_index, fp_train, clf)

    The disk cache is used only when BOTH pickles are listed in
    ``cur_dir_contents``; if either is missing, features and model are
    regenerated. Checking the model file alone would crash on a missing
    feature file. Raw training images are kept in the module-level
    CACHED_UNPROC_TRAINING so later sweep iterations skip the disk read.
    """
    global NPOS_TRAINING_IMGS,NNEG_TRAINING_IMGS
    global CACHED_UNPROC_TRAINING # training
    cache_complete = SVM_MODEL in cur_dir_contents and PRE_TRAINING_IMGS in cur_dir_contents
    if not cache_complete:
        log_result('\n[Training SVM model]:')
        # get unprocessed images
        if CACHED_UNPROC_TRAINING is None:
            x_train, y_train, fp_train = load_images(True, NPOS_TRAINING_IMGS,NNEG_TRAINING_IMGS)
            # deep copies keep the RAM cache independent of later processing
            CACHED_UNPROC_TRAINING = (copy.deepcopy(x_train), copy.deepcopy(y_train), copy.deepcopy(fp_train))
        else:
            log_result('  * Loading cached unprocessed images from RAM')
            start_time = time.time()
            x_train, y_train, fp_train = copy.deepcopy(CACHED_UNPROC_TRAINING)
            log_result('    {:.3f}s loading time'.format(time.time() - start_time))
        # process images, generate model
        x_train, y_train, fp_train_index, fp_train = images_to_hog(x_train, y_train, fp_train, True, save_fn=PRE_TRAINING_IMGS)
        clf = gen_model(SVM_MODEL,x_train,y_train)
    else:
        log_result('\n[Loading cached SVM model & training images]:')
        # NOTE: unpickling can execute arbitrary code; only load cache files
        # that this notebook produced itself.
        with open(SVM_MODEL, 'rb') as fh:
            clf = pickle.load(fh)
        with open(PRE_TRAINING_IMGS, 'rb') as fh:
            x_train, y_train, fp_train_index, fp_train = pickle.load(fh)

    log_result('Number of training images loaded: {}'.format(len(x_train)))
    return x_train, y_train, fp_train_index, fp_train, clf

# 2. Generate test images or load cached result
def get_test_imgs(cur_dir_contents, PRE_TESTING_IMGS):
    """Return the HOG features of the test split, from disk cache if available.

    Args:
        cur_dir_contents: names of the files present in the working directory.
        PRE_TESTING_IMGS: file name of the pickled test features.

    Returns:
        (x_test, y_test, fp_test_index, fp_test)

    Raw test images are kept in the module-level CACHED_UNPROC_TESTING so
    later sweep iterations skip the disk read.
    """
    global CACHED_UNPROC_TESTING  # testing
    if PRE_TESTING_IMGS in cur_dir_contents:
        log_result('\n[Loading cached test images]:')
        # NOTE: unpickling can execute arbitrary code; only load cache files
        # that this notebook produced itself.
        with open(PRE_TESTING_IMGS, 'rb') as fh:
            x_test, y_test, fp_test_index, fp_test = pickle.load(fh)
    else:
        log_result('\n[Generating test images]:')
        # get unprocessed images
        if CACHED_UNPROC_TESTING is None:
            x_test, y_test, fp_test = load_images(False)
            # deep copies keep the RAM cache independent of later processing
            CACHED_UNPROC_TESTING = (copy.deepcopy(x_test), copy.deepcopy(y_test), copy.deepcopy(fp_test))
        else:
            log_result('  * Loading cached unprocessed test images from RAM')
            start_time = time.time()
            x_test, y_test, fp_test = copy.deepcopy(CACHED_UNPROC_TESTING)
            log_result('    {:.3f}s loading time'.format(time.time() - start_time))
        # convert to HOG features and cache them on disk (no model is built here)
        x_test, y_test, fp_test_index, fp_test = images_to_hog(x_test, y_test, fp_test, True, save_fn=PRE_TESTING_IMGS)

    log_result('Number of testing images loaded: {}'.format(len(x_test)))
    return x_test, y_test, fp_test_index, fp_test
            
# 3. Evaluate performance (for all permutations)
#    call: run_test()
#    manual post-analysis: filter_failed_fp()

# Wrapper for single iteration. Note: all CSV write logic to be contained here. (hack)
def run_hogsvm():
    """Run one train/evaluate cycle for the current HOG parameter combination.

    Reads the module-level NORIENTATIONS, CELL_PIXELSHAPE, CELLS_PER_BLOCK,
    BLOCK_NORM and POWER_LAW_COMPRESSION, derives the cache/result file names
    from them, trains or loads the classifier, evaluates it on the test and
    training data, and lists the misclassified test images.

    Side effects:
        * writes 'hogsvm_result<params>.txt' through RESULTS_FH / log_result();
        * extends the module-level CSV_LINE with, in order: feature size, test
          AUC, accuracy, precision, recall, training accuracy, test prediction
          time, then TP, TN, FP, FN (the caller writes the CSV row).

    The results file is closed and RESULTS_FH reset to None even if a step
    raises, so a failed run does not leak the handle.
    """
    global NORIENTATIONS, CELL_PIXELSHAPE, CELLS_PER_BLOCK, BLOCK_NORM, POWER_LAW_COMPRESSION
    global RESULTS_FH, CSV_LINE
    base_fn = '_ori({})_cellpix({})_blksze({})_blknrm({})'.format(
        NORIENTATIONS, CELL_PIXELSHAPE[0], CELLS_PER_BLOCK[0], BLOCK_NORM)
    pickle_type = '.pickle'
    text_type = '.txt'
    SVM_MODEL = 'hogsvm_model' + base_fn + pickle_type
    PRE_TRAINING_IMGS = 'hogsvm_train' + base_fn + pickle_type
    PRE_TESTING_IMGS = 'hogsvm_test' + base_fn + pickle_type
    results_fn = 'hogsvm_result' + base_fn + text_type

    # snapshot taken before the results file is created
    cur_dir_contents = os.listdir('.')
    RESULTS_FH = open(results_fn, 'w')
    try:
        log_result('[Current parameter sweep]:')
        log_result('  * Number of orientations: {}'.format(NORIENTATIONS))
        log_result('  * Cell pixel shape: {}'.format(CELL_PIXELSHAPE))
        log_result('  * Number of cells per block: {}'.format(CELLS_PER_BLOCK))
        log_result('  * Block normalisation method: {}'.format(BLOCK_NORM))
        log_result('  * Power law compression (preprocessing) on: {}'.format(POWER_LAW_COMPRESSION))
        # (NOTE: actually, power law is square root --> slightly different method)

        # load svm model and test dataset
        x_train, y_train, fp_train_index, fp_train, clf = get_svm_model(cur_dir_contents, SVM_MODEL, PRE_TRAINING_IMGS)
        x_test, y_test, fp_test_index, fp_test          = get_test_imgs(cur_dir_contents, PRE_TESTING_IMGS)
        # * (CSV): get hog shape (duplicated logic)
        CSV_LINE.append(x_train.shape[1]) # 'Feature Size'

        # evaluate on test and training datasets (as a crude check for overfitting)
        log_result('\n[Classifier statistics (on test data)]:')
        y_pred, y_prob, stats_test = run_test(clf, x_test, y_test)
        log_result('\n[Classifier statistics (on training data)]:')
        y_pred_training, y_prob_training, stats_train = run_test(clf, x_train, y_train)
        # * (CSV): add stats
        CSV_LINE += [stats_test['AUC'], stats_test['Accuracy'], stats_test['Precision'],
                     stats_test['Recall'], stats_train['Accuracy'], stats_test['Prediction Time']]
        # ravel() of the 2x2 matrix yields tn, fp, fn, tp; the CSV wants TP, TN, FP, FN
        tn_teststat, fp_teststat, fn_teststat, tp_teststat = stats_test['Confusion Matrix'].ravel()
        CSV_LINE += [tp_teststat, tn_teststat, fp_teststat, fn_teststat]

        # identify all false results (written to the results file only)
        failed_fp = filter_failed_fp(y_pred, y_test, fp_test_index, fp_test)
        log_result('\n[Falsely detected images]:')
        for label, fp in failed_fp:
            log_result('  * {}: {}'.format(label,fp), on_console=False)
    finally:
        RESULTS_FH.close()
        RESULTS_FH = None

In [10]:
# [PARAMETER SWEEP]
# Runs run_hogsvm() once per combination of the configured HOG parameters and
# writes one summary row per run to 'hogsvm_result_all.csv'.
ntests = len(BLOCK_SIZE_LIST) * len(BLOCK_NORM_LIST) * len(CELL_PIXEL_LIST) * len(ORIENTATION_LIST)
count = 1
test_start_time = time.time()

# RAM caches of the raw images, filled on first use by get_svm_model() / get_test_imgs()
CACHED_UNPROC_TRAINING = None
CACHED_UNPROC_TESTING = None
# Row under construction: started here, completed inside run_hogsvm()
CSV_LINE = None

csv_headers = ['Test', 'Cells per Block', 'Pixels per Cell', 'Orientations', 
               'Feature Size', 'AUC', 'Accuracy', 'Precision', 'Recall', 
               'Training Accuracy', 'Prediction Time (s)',
               'TP', 'TN', 'FP', 'FN'] # must write to in same order

# `with` guarantees the CSV is flushed and closed even if a run raises part-way
# through the sweep, so the rows completed so far are not lost.
with open('hogsvm_result_all.csv', 'w', newline='') as csv_fh:
    csv_writer = csv.writer(csv_fh)
    csv_writer.writerow(csv_headers)

    # block parameters
    for block_size in BLOCK_SIZE_LIST:
        CELLS_PER_BLOCK = (block_size, block_size)
        for BLOCK_NORM in BLOCK_NORM_LIST:
            # cell/orientation parameters
            for cp in CELL_PIXEL_LIST:
                CELL_PIXELSHAPE = (cp,cp)
                for NORIENTATIONS in ORIENTATION_LIST:
                    print('\n####[TEST {}/{}]##################################################################'.format(count,ntests))
                    CSV_LINE = [count, block_size, cp, NORIENTATIONS]
                    run_hogsvm()
                    csv_writer.writerow(CSV_LINE)
                    count += 1


####[TEST 1/32]##################################################################
[Current parameter sweep]:
  * Number of orientations: 13
  * Cell pixel shape: (4, 4)
  * Number of cells per block: (1, 1)
  * Block normalisation method: L2-Hys
  * Power law compression (preprocessing) on: True

[Training SVM model]:
  * 1.351s runtime (images loaded): Individual_Component\train\train_positive_A\00000000
  * 1.140s runtime (images loaded): Individual_Component\train\train_positive_A\00000001
  * 1.215s runtime (images loaded): Individual_Component\train\train_positive_A\00000002
  * 1.116s runtime (images loaded): Individual_Component\train\train_negative_A\00000000
  * 1.014s runtime (images loaded): Individual_Component\train\train_negative_A\00000001
  * 1.023s runtime (images loaded): Individual_Component\train\train_negative_A\00000002
  * 46.488s runtime (conversion to HOG)
  * 0.075s runtime (shuffling)
HOG descriptor size: (4160,)
4.413s runtime (SGD training)
Number of train



6.472s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.112s loading time
  * 28.387s runtime (conversion to HOG)
  * 0.047s runtime (shuffling)
HOG descriptor size: (1040,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.644294s prediction time (0.000068 s/image)
  * AUC (weighted): 0.995546813
  * Accuracy: 0.970075077
  * Precision (weighted): 0.970486644
  * Recall (weighted): 0.970075077
  * Confusion Matrix:
[[5808  192]
 [  91 3366]]

[Classifier statistics (on training data)]:
  * 0.443107s prediction time (0.000074 s/image)
  * AUC (weighted): 1.000000000
  * Accuracy: 1.000000000
  * Precision (weighted): 1.000000000
  * Recall (weighted): 1.000000000
  * Confusion Matrix:
[[3000    0]
 [   0 3000]]

[Falsely detected images]:

####[TEST 6/32]##################################################################
[Current parameter sweep]:
  * Numb



3.964s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.078s loading time
  * 22.685s runtime (conversion to HOG)
  * 0.031s runtime (shuffling)
HOG descriptor size: (728,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.431482s prediction time (0.000046 s/image)
  * AUC (weighted): 0.991523720
  * Accuracy: 0.954002326
  * Precision (weighted): 0.954929767
  * Recall (weighted): 0.954002326
  * Confusion Matrix:
[[5706  294]
 [ 141 3316]]

[Classifier statistics (on training data)]:
  * 0.314855s prediction time (0.000052 s/image)
  * AUC (weighted): 0.999486889
  * Accuracy: 0.996000000
  * Precision (weighted): 0.996003527
  * Recall (weighted): 0.996000000
  * Confusion Matrix:
[[2984   16]
 [   8 2992]]

[Falsely detected images]:

####[TEST 7/32]##################################################################
[Current parameter sweep]:
  * Numbe



3.252s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.093s loading time
  * 23.773s runtime (conversion to HOG)
  * 0.031s runtime (shuffling)
HOG descriptor size: (624,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.419570s prediction time (0.000044 s/image)
  * AUC (weighted): 0.994351075
  * Accuracy: 0.964999471
  * Precision (weighted): 0.965686920
  * Recall (weighted): 0.964999471
  * Confusion Matrix:
[[5767  233]
 [  98 3359]]

[Classifier statistics (on training data)]:
  * 0.236385s prediction time (0.000039 s/image)
  * AUC (weighted): 0.999622444
  * Accuracy: 0.995166667
  * Precision (weighted): 0.995166722
  * Recall (weighted): 0.995166667
  * Confusion Matrix:
[[2986   14]
 [  15 2985]]

[Falsely detected images]:

####[TEST 8/32]##################################################################
[Current parameter sweep]:
  * Numbe



1.053s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.095s loading time
  * 18.158s runtime (conversion to HOG)
  * 0.016s runtime (shuffling)
HOG descriptor size: (260,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.201261s prediction time (0.000021 s/image)
  * AUC (weighted): 0.988860332
  * Accuracy: 0.951253040
  * Precision (weighted): 0.952378178
  * Recall (weighted): 0.951253040
  * Confusion Matrix:
[[5684  316]
 [ 145 3312]]

[Classifier statistics (on training data)]:
  * 0.110703s prediction time (0.000018 s/image)
  * AUC (weighted): 0.994130667
  * Accuracy: 0.966666667
  * Precision (weighted): 0.966713338
  * Recall (weighted): 0.966666667
  * Confusion Matrix:
[[2885  115]
 [  85 2915]]

[Falsely detected images]:

####[TEST 9/32]##################################################################
[Current parameter sweep]:
  * Numbe

9.349s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.093s loading time
  * 21.323s runtime (conversion to HOG)
  * 0.079s runtime (shuffling)
HOG descriptor size: (2184,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 1.405612s prediction time (0.000149 s/image)
  * AUC (weighted): 0.996787677
  * Accuracy: 0.974093264
  * Precision (weighted): 0.974401259
  * Recall (weighted): 0.974093264
  * Confusion Matrix:
[[5834  166]
 [  79 3378]]

[Classifier statistics (on training data)]:
  * 0.871909s prediction time (0.000145 s/image)
  * AUC (weighted): 1.000000000
  * Accuracy: 1.000000000
  * Precision (weighted): 1.000000000
  * Recall (weighted): 1.000000000
  * Confusion Matrix:
[[3000    0]
 [   0 3000]]

[Falsely detected images]:

####[TEST 15/32]##################################################################
[Current parameter sweep]:
  * Num



1.761s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.101s loading time
  * 15.945s runtime (conversion to HOG)
  * 0.028s runtime (shuffling)
HOG descriptor size: (624,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.390841s prediction time (0.000041 s/image)
  * AUC (weighted): 0.994862501
  * Accuracy: 0.966056889
  * Precision (weighted): 0.966705185
  * Recall (weighted): 0.966056889
  * Confusion Matrix:
[[5774  226]
 [  95 3362]]

[Classifier statistics (on training data)]:
  * 0.252060s prediction time (0.000042 s/image)
  * AUC (weighted): 0.998096444
  * Accuracy: 0.980833333
  * Precision (weighted): 0.980856895
  * Recall (weighted): 0.980833333
  * Confusion Matrix:
[[2932   68]
 [  47 2953]]

[Falsely detected images]:

####[TEST 17/32]##################################################################
[Current parameter sweep]:
  * Numb

  * 0.067s runtime (shuffling)
HOG descriptor size: (3510,)
13.721s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.079s loading time
  * 20.016s runtime (conversion to HOG)
  * 0.100s runtime (shuffling)
HOG descriptor size: (3510,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 2.168786s prediction time (0.000229 s/image)
  * AUC (weighted): 0.996658085
  * Accuracy: 0.972084170
  * Precision (weighted): 0.972568574
  * Recall (weighted): 0.972084170
  * Confusion Matrix:
[[5811  189]
 [  75 3382]]

[Classifier statistics (on training data)]:
  * 1.415319s prediction time (0.000236 s/image)
  * AUC (weighted): 0.999973111
  * Accuracy: 0.998833333
  * Precision (weighted): 0.998833832
  * Recall (weighted): 0.998833333
  * Confusion Matrix:
[[2995    5]
 [   2 2998]]

[Falsely detected images]:

####[TEST 23/32]########################################



2.132s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.158s loading time
  * 15.431s runtime (conversion to HOG)
  * 0.030s runtime (shuffling)
HOG descriptor size: (702,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 0.475749s prediction time (0.000050 s/image)
  * AUC (weighted): 0.994411002
  * Accuracy: 0.963307603
  * Precision (weighted): 0.964124591
  * Recall (weighted): 0.963307603
  * Confusion Matrix:
[[5752  248]
 [  99 3358]]

[Classifier statistics (on training data)]:
  * 0.352732s prediction time (0.000059 s/image)
  * AUC (weighted): 0.997484444
  * Accuracy: 0.974000000
  * Precision (weighted): 0.974007584
  * Recall (weighted): 0.974000000
  * Confusion Matrix:
[[2916   84]
 [  72 2928]]

[Falsely detected images]:

####[TEST 25/32]##################################################################
[Current parameter sweep]:
  * Numb

  * 0.077s runtime (shuffling)
HOG descriptor size: (4160,)
13.559s runtime (SGD training)
Number of training images loaded: 6000

[Generating test images]:
  * Loading cached unprocessed test images from RAM
    0.101s loading time
  * 17.933s runtime (conversion to HOG)
  * 0.157s runtime (shuffling)
HOG descriptor size: (4160,)
Number of testing images loaded: 9457

[Classifier statistics (on test data)]:
  * 2.793358s prediction time (0.000295 s/image)
  * AUC (weighted): 0.996431974
  * Accuracy: 0.969652110
  * Precision (weighted): 0.970290200
  * Recall (weighted): 0.969652110
  * Confusion Matrix:
[[5790  210]
 [  77 3380]]

[Classifier statistics (on training data)]:
  * 2.010662s prediction time (0.000335 s/image)
  * AUC (weighted): 0.999854667
  * Accuracy: 0.996333333
  * Precision (weighted): 0.996333554
  * Recall (weighted): 0.996333333
  * Confusion Matrix:
[[2988   12]
 [  10 2990]]

[Falsely detected images]:

####[TEST 31/32]########################################

In [11]:
# Safety net: close the results file if a run left it open, then report the total time.
if RESULTS_FH is not None:
    RESULTS_FH.close()
    RESULTS_FH = None  # forget the closed handle so nothing tries to write to it
print('{:.3f}s elapsed (entire test)'.format(time.time() - test_start_time))
print('DONE')

2870.591s elapsed (entire test)
DONE
