# Vehicle Detection Pipeline

#### Imports

In [1]:
import matplotlib.image as mpimg
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import cv2
import glob
import time
#
from sklearn.preprocessing import StandardScaler
from skimage.feature import hog
from sklearn.model_selection import train_test_split
#
import pickle

#### HOG Classification

In [None]:
def get_hog_features(img, orient, pix_per_cell, cell_per_block,
                     vis=False, feature_vec=True):
    """Run skimage's ``hog`` on ``img`` with square cells and square blocks.

    Args:
        img: image handed straight to ``hog`` (callers in this notebook pass
            a single 2-D channel).
        orient: number of orientation bins.
        pix_per_cell: cell edge length in pixels (used for both axes).
        cell_per_block: block edge length in cells (used for both axes).
        vis: forwarded to ``hog``; when True the result is the
            ``(features, hog_image)`` pair instead of the features alone.
        feature_vec: forwarded to ``hog`` as ``feature_vector``.

    Returns:
        Whatever ``hog`` returns for the given ``vis`` flag.
    """
    # NOTE(review): the keyword is spelled ``visualise`` here; newer
    # scikit-image releases spell it ``visualize`` -- confirm against the
    # installed version.
    cell_shape = (pix_per_cell, pix_per_cell)
    block_shape = (cell_per_block, cell_per_block)
    return hog(img,
               orientations=orient,
               pixels_per_cell=cell_shape,
               cells_per_block=block_shape,
               transform_sqrt=True,
               visualise=vis,
               feature_vector=feature_vec)

def bin_spatial(img, size=(32, 32)):
    """Return spatially binned colour features.

    The image is resized to ``size`` with ``cv2.resize`` and the result is
    flattened into a 1-D feature vector.
    """
    downsampled = cv2.resize(img, size)
    return downsampled.ravel()

# NEED TO CHANGE bins_range if reading .png files with mpimg!
def color_hist(img, nbins=32, bins_range=(0, 256)):
    """Return the concatenated per-channel histogram counts of ``img``.

    Args:
        img: array indexed as ``img[:, :, channel]``; channels 0, 1 and 2
            are histogrammed.
        nbins: number of histogram bins per channel.
        bins_range: ``(low, high)`` value range passed to ``np.histogram``.

    Returns:
        1-D array of length ``3 * nbins`` holding only the bin counts
        (bin edges are discarded).
    """
    counts_per_channel = [
        np.histogram(img[:, :, channel], bins=nbins, range=bins_range)[0]
        for channel in range(3)
    ]
    return np.concatenate(counts_per_channel)

def extract_features(imgs, color_space='RGB', spatial_size=(32, 32),
                     hist_bins=32, orient=9,
                     pix_per_cell=8, cell_per_block=2, hog_channel=0,
                     spatial_feat=True, hist_feat=True, hog_feat=True):
    """Extract one concatenated feature vector per image file.

    Each file is read with ``mpimg.imread``, optionally converted from RGB
    to ``color_space``, and then described by any combination of spatial
    binning (``bin_spatial``), colour histograms (``color_hist``) and HOG
    (``get_hog_features``).

    Args:
        imgs: iterable of image file paths.
        color_space: one of 'RGB', 'HSV', 'LUV', 'HLS', 'YUV', 'YCrCb'.
        spatial_size: target size for ``bin_spatial``.
        hist_bins: number of bins for ``color_hist``.
        orient, pix_per_cell, cell_per_block: HOG parameters.
        hog_channel: channel index, or 'ALL' to use every channel.
        spatial_feat, hist_feat, hog_feat: enable/disable each feature group.

    Returns:
        List with one 1-D feature array per input file.

    Raises:
        ValueError: if ``color_space`` is not supported. Previously an
            unknown name left ``feature_image`` unassigned and failed with
            an UnboundLocalError in the middle of the loop.
    """
    # cv2 conversion constants are looked up by name so that validation does
    # not depend on any image having been read yet.
    conversions = {
        'HSV': 'COLOR_RGB2HSV',
        'LUV': 'COLOR_RGB2LUV',
        'HLS': 'COLOR_RGB2HLS',
        'YUV': 'COLOR_RGB2YUV',
        'YCrCb': 'COLOR_RGB2YCrCb',
    }
    if color_space != 'RGB' and color_space not in conversions:
        raise ValueError(
            "Unsupported color_space {!r}; expected 'RGB' or one of {}".format(
                color_space, sorted(conversions)))

    features = []
    for file in imgs:
        image = mpimg.imread(file)
        if color_space == 'RGB':
            feature_image = np.copy(image)
        else:
            feature_image = cv2.cvtColor(
                image, getattr(cv2, conversions[color_space]))

        file_features = []
        if spatial_feat:
            file_features.append(bin_spatial(feature_image, size=spatial_size))
        if hist_feat:
            file_features.append(color_hist(feature_image, nbins=hist_bins))
        if hog_feat:
            if hog_channel == 'ALL':
                # One HOG vector per channel, flattened into a single vector
                hog_features = np.ravel([
                    get_hog_features(feature_image[:, :, channel],
                                     orient, pix_per_cell, cell_per_block,
                                     vis=False, feature_vec=True)
                    for channel in range(feature_image.shape[2])
                ])
            else:
                hog_features = get_hog_features(
                    feature_image[:, :, hog_channel], orient,
                    pix_per_cell, cell_per_block, vis=False, feature_vec=True)
            file_features.append(hog_features)
        features.append(np.concatenate(file_features))
    return features

#### Drawing Boxes

In [None]:
def draw_boxes(img, bboxes, color=(0, 0, 255), thick=6):
    """Return a copy of ``img`` with a rectangle drawn for every box.

    Args:
        img: image array; it is copied, the input is not modified.
        bboxes: iterable of boxes; ``box[0]`` and ``box[1]`` are passed to
            ``cv2.rectangle`` as the two corner points.
        color: rectangle colour passed to ``cv2.rectangle``.
        thick: line thickness passed to ``cv2.rectangle``.
    """
    canvas = np.copy(img)
    for box in bboxes:
        first_corner, second_corner = box[0], box[1]
        cv2.rectangle(canvas, first_corner, second_corner, color, thick)
    return canvas
    
    
def slide_window(img, x_start_stop=(None, None), y_start_stop=(None, None),
                 xy_window=(64, 64), xy_overlap=(0.5, 0.5)):
    """List the sliding-window boxes covering a region of ``img``.

    Args:
        img: image array; only ``img.shape[0]`` (height) and
            ``img.shape[1]`` (width) are used.
        x_start_stop: ``(start, stop)`` of the search region in x. A ``None``
            entry means 0 for start and the image width for stop.
        y_start_stop: same for y (``None`` stop means the image height).
        xy_window: window size as ``(width, height)``.
        xy_overlap: fractional overlap between neighbouring windows in
            ``(x, y)``.

    Returns:
        List of ``((startx, starty), (endx, endy))`` tuples, ordered row by
        row.

    The bounds arguments are never modified. The previous implementation
    wrote the resolved values back into the argument lists, which both
    altered the caller's list and, through the shared default list, made
    later calls reuse the bounds of the first image.
    """
    # Resolve open-ended bounds into locals instead of mutating the inputs
    x_start = 0 if x_start_stop[0] is None else x_start_stop[0]
    x_stop = img.shape[1] if x_start_stop[1] is None else x_start_stop[1]
    y_start = 0 if y_start_stop[0] is None else y_start_stop[0]
    y_stop = img.shape[0] if y_start_stop[1] is None else y_start_stop[1]

    # Span of the region to be searched
    xspan = x_stop - x_start
    yspan = y_stop - y_start

    # Pixels per step in x/y (built-in int: the np.int alias no longer
    # exists in current NumPy)
    nx_pix_per_step = int(xy_window[0] * (1 - xy_overlap[0]))
    ny_pix_per_step = int(xy_window[1] * (1 - xy_overlap[1]))

    # Number of windows that fit in x/y
    nx_buffer = int(xy_window[0] * xy_overlap[0])
    ny_buffer = int(xy_window[1] * xy_overlap[1])
    nx_windows = int((xspan - nx_buffer) / nx_pix_per_step)
    ny_windows = int((yspan - ny_buffer) / ny_pix_per_step)

    window_list = []
    for ys in range(ny_windows):
        starty = ys * ny_pix_per_step + y_start
        endy = starty + xy_window[1]
        for xs in range(nx_windows):
            startx = xs * nx_pix_per_step + x_start
            endx = startx + xy_window[0]
            window_list.append(((startx, starty), (endx, endy)))
    return window_list

In [None]:
def single_img_features(img, color_space='RGB', spatial_size=(32, 32),
                        hist_bins=32, orient=9,
                        pix_per_cell=8, cell_per_block=2, hog_channel=0,
                        spatial_feat=True, hist_feat=True, hog_feat=True):
    """Extract the concatenated feature vector of a single image.

    Single-image counterpart of ``extract_features``: the image array is
    optionally converted from RGB to ``color_space`` and described by spatial
    binning, colour histograms and HOG, as selected by the flags.

    Args:
        img: RGB image array (already loaded, not a path).
        color_space: one of 'RGB', 'HSV', 'LUV', 'HLS', 'YUV', 'YCrCb'.
        spatial_size: target size for ``bin_spatial``.
        hist_bins: number of bins for ``color_hist``.
        orient, pix_per_cell, cell_per_block: HOG parameters.
        hog_channel: channel index, or 'ALL' to use every channel.
        spatial_feat, hist_feat, hog_feat: enable/disable each feature group.

    Returns:
        1-D array with the enabled feature groups concatenated in the order
        spatial, histogram, HOG.

    Raises:
        ValueError: if ``color_space`` is not supported. Previously an
            unknown name left ``feature_image`` unassigned and failed later
            with an UnboundLocalError.
    """
    # cv2 conversion constants are looked up by name, only when needed
    conversions = {
        'HSV': 'COLOR_RGB2HSV',
        'LUV': 'COLOR_RGB2LUV',
        'HLS': 'COLOR_RGB2HLS',
        'YUV': 'COLOR_RGB2YUV',
        'YCrCb': 'COLOR_RGB2YCrCb',
    }
    if color_space == 'RGB':
        feature_image = np.copy(img)
    elif color_space in conversions:
        feature_image = cv2.cvtColor(img, getattr(cv2, conversions[color_space]))
    else:
        raise ValueError(
            "Unsupported color_space {!r}; expected 'RGB' or one of {}".format(
                color_space, sorted(conversions)))

    img_features = []
    if spatial_feat:
        img_features.append(bin_spatial(feature_image, size=spatial_size))
    if hist_feat:
        img_features.append(color_hist(feature_image, nbins=hist_bins))
    if hog_feat:
        if hog_channel == 'ALL':
            # One HOG vector per channel, flattened into a single vector
            hog_features = np.ravel([
                get_hog_features(feature_image[:, :, channel],
                                 orient, pix_per_cell, cell_per_block,
                                 vis=False, feature_vec=True)
                for channel in range(feature_image.shape[2])
            ])
        else:
            hog_features = get_hog_features(
                feature_image[:, :, hog_channel], orient,
                pix_per_cell, cell_per_block, vis=False, feature_vec=True)
        img_features.append(hog_features)

    return np.concatenate(img_features)

def search_windows(img, windows, clf, scaler, color_space='RGB', 
                    spatial_size=(32, 32), hist_bins=32, 
                    hist_range=(0, 256), orient=9, 
                    pix_per_cell=8, cell_per_block=2, 
                    hog_channel=0, spatial_feat=True, 
                    hist_feat=True, hog_feat=True):
    """Return the windows that the classifier labels as positive.

    Args:
        img: image to search.
        windows: iterable of ``((x1, y1), (x2, y2))`` boxes, e.g. the output
            of ``slide_window``.
        clf: classifier exposing ``predict``.
        scaler: fitted scaler exposing ``transform``.
        hist_range: accepted but not used by this function.
        Remaining keyword arguments are forwarded to
        ``single_img_features``.

    Returns:
        List of the windows whose prediction equals 1, in input order.
    """
    positives = []
    for window in windows:
        top_left, bottom_right = window[0], window[1]
        # Crop the window and bring it to the 64x64 size used for features
        crop = img[top_left[1]:bottom_right[1], top_left[0]:bottom_right[0]]
        test_img = cv2.resize(crop, (64, 64))
        features = single_img_features(
            test_img,
            color_space=color_space,
            spatial_size=spatial_size,
            hist_bins=hist_bins,
            orient=orient,
            pix_per_cell=pix_per_cell,
            cell_per_block=cell_per_block,
            hog_channel=hog_channel,
            spatial_feat=spatial_feat,
            hist_feat=hist_feat,
            hog_feat=hog_feat,
        )
        # The scaler expects a 2-D array holding a single sample
        sample = np.array(features).reshape(1, -1)
        prediction = clf.predict(scaler.transform(sample))
        if prediction == 1:
            positives.append(window)
    return positives

In [None]:
# Display every JPEG in ./test_images, one matplotlib figure per image.
test_images = glob.glob("./test_images/*.jpg")
for fname in test_images:
    img = cv2.imread(fname)
    # Convert from BGR to RGB channel order before handing the image to matplotlib
    img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
    f, ax1 = plt.subplots(1, 1, figsize=(24, 9))
    f.tight_layout()
    ax1.imshow(img)
    ax1.set_title('Original Image', fontsize=25)
    # NOTE(review): no OpenCV window is opened in this cell, so this wait
    # presumably has no visible effect -- confirm it can be dropped.
    cv2.waitKey(200)

In [None]:
def convert_color(img, conv='RGB2YCrCb'):
    """Convert ``img`` to another colour space with ``cv2.cvtColor``.

    Args:
        img: image array; RGB channel order for every option except
            'BGR2YCrCb', which expects BGR.
        conv: target conversion name. Supported values are 'RGB' (returns
            ``img`` unchanged), 'YCrCb', 'RGB2YCrCb' (alias of 'YCrCb'),
            'BGR2YCrCb', 'LUV', 'YUV', 'HSV' and 'HLS'.

    Returns:
        The converted image, or ``img`` itself for 'RGB'.

    Raises:
        ValueError: if ``conv`` is not one of the supported names.
            Previously unknown names -- including the function's own default
            'RGB2YCrCb' -- fell through every branch and returned None.
    """
    if conv == 'RGB':
        return img
    # Conversion name -> name of the cv2 constant (resolved only when used)
    cv2_codes = {
        'YCrCb': 'COLOR_RGB2YCrCb',
        'RGB2YCrCb': 'COLOR_RGB2YCrCb',
        'BGR2YCrCb': 'COLOR_BGR2YCrCb',
        'LUV': 'COLOR_RGB2LUV',
        'YUV': 'COLOR_RGB2YUV',
        'HSV': 'COLOR_RGB2HSV',
        'HLS': 'COLOR_RGB2HLS',
    }
    if conv not in cv2_codes:
        raise ValueError(
            "Unsupported conversion {!r}; expected 'RGB' or one of {}".format(
                conv, sorted(cv2_codes)))
    return cv2.cvtColor(img, getattr(cv2, cv2_codes[conv]))

def find_cars(img, ystart, ystop, scale, svc, X_scaler, orient, pix_per_cell, cell_per_block, spatial_size, hist_bins,
             cells_per_step=2, color_conv='YCrCb'):
    """Detect cars in a horizontal band of ``img`` using HOG sub-sampling.

    HOG is computed once per channel for the whole (rescaled) band; each
    64x64 search window then reuses the matching slice of that HOG array,
    combined with spatial and colour-histogram features of the window.

    Args:
        img: image array indexed ``[y, x, channel]``.
        ystart, ystop: rows delimiting the band to search.
        scale: the band is shrunk by this factor before searching, so a
            64-pixel window covers ``64 * scale`` original pixels.
        svc: classifier exposing ``predict``.
        X_scaler: fitted scaler exposing ``transform``.
        orient, pix_per_cell, cell_per_block: HOG parameters.
        spatial_size: target size for ``bin_spatial``.
        hist_bins: number of bins for ``color_hist``.
        cells_per_step: window stride, in HOG cells.
        color_conv: conversion name passed to ``convert_color``.

    Returns:
        List of ``[(x1, y1), (x2, y2)]`` boxes, in original image
        coordinates, for every window predicted as 1.
    """
    # Pixel values are divided by 255 before feature extraction.
    # NOTE(review): presumably this matches the value range of the training
    # images as loaded by mpimg -- confirm against the training data.
    img = img.astype(np.float32) / 255
    img_tosearch = img[ystart:ystop, :, :]
    bbox_list = []

    ctrans_tosearch = convert_color(img_tosearch, conv=color_conv)
    if scale != 1:
        imshape = ctrans_tosearch.shape
        ctrans_tosearch = cv2.resize(
            ctrans_tosearch,
            (int(imshape[1] / scale), int(imshape[0] / scale)))

    ch1 = ctrans_tosearch[:, :, 0]
    ch2 = ctrans_tosearch[:, :, 1]
    ch3 = ctrans_tosearch[:, :, 2]

    # Number of HOG blocks along each axis of the band
    nxblocks = (ch1.shape[1] // pix_per_cell) - cell_per_block + 1
    nyblocks = (ch1.shape[0] // pix_per_cell) - cell_per_block + 1

    # 64 was the original sampling rate, with 8 cells and 8 pix per cell
    window = 64
    nblocks_per_window = (window // pix_per_cell) - cell_per_block + 1
    # "+ 1" counts the starting position itself; without it the last window
    # (flush with the right/bottom edge) was never evaluated, and a band
    # exactly one window wide or tall produced no windows at all. A band
    # smaller than one window still yields a non-positive count, i.e. no
    # iterations.
    nxsteps = (nxblocks - nblocks_per_window) // cells_per_step + 1
    nysteps = (nyblocks - nblocks_per_window) // cells_per_step + 1

    # Compute individual channel HOG features for the entire band
    hog1 = get_hog_features(ch1, orient, pix_per_cell, cell_per_block, feature_vec=False)
    hog2 = get_hog_features(ch2, orient, pix_per_cell, cell_per_block, feature_vec=False)
    hog3 = get_hog_features(ch3, orient, pix_per_cell, cell_per_block, feature_vec=False)

    for xb in range(nxsteps):
        for yb in range(nysteps):
            ypos = yb * cells_per_step
            xpos = xb * cells_per_step
            # Extract HOG for this patch
            hog_feat1 = hog1[ypos:ypos+nblocks_per_window, xpos:xpos+nblocks_per_window].ravel()
            hog_feat2 = hog2[ypos:ypos+nblocks_per_window, xpos:xpos+nblocks_per_window].ravel()
            hog_feat3 = hog3[ypos:ypos+nblocks_per_window, xpos:xpos+nblocks_per_window].ravel()
            hog_features = np.hstack((hog_feat1, hog_feat2, hog_feat3))

            xleft = xpos * pix_per_cell
            ytop = ypos * pix_per_cell

            # Extract the image patch
            subimg = cv2.resize(ctrans_tosearch[ytop:ytop+window, xleft:xleft+window], (64, 64))

            # Get color features
            spatial_features = bin_spatial(subimg, size=spatial_size)
            hist_features = color_hist(subimg, nbins=hist_bins)

            # Scale features and make a prediction
            test_features = X_scaler.transform(
                np.hstack((spatial_features, hist_features, hog_features)).reshape(1, -1))
            test_prediction = svc.predict(test_features)

            if test_prediction == 1:
                # Map the window back to original-image coordinates
                xbox_left = int(xleft * scale)
                ytop_draw = int(ytop * scale)
                win_draw = int(window * scale)
                bbox_list.append([(xbox_left, ytop_draw + ystart),
                                  (xbox_left + win_draw, ytop_draw + win_draw + ystart)])

    return bbox_list

### Testbed

#### 1 | Train SVC

In [None]:
from sklearn.svm import LinearSVC
# Testbed: train a LinearSVC on a subset of the car / non-car PNGs.
# The settings, `svc` and `X_scaler` defined here are module-level names.
extra_images = glob.glob('./non-vehicles/Extras/*.png')
car_images = glob.glob('./vehicles/KITTI_extracted/*.png')
cars = []
notcars = []
# images are PNGs
for img in extra_images:
    notcars.append(img)
for img in car_images:
    cars.append(img)
print("# of car images:{}".format(len(cars)))
print("# of non-car images:{}".format(len(notcars)))
# Keep at most `sample_size` file paths per class
sample_size = 1500
cars = cars[0:sample_size]
notcars = notcars[0:sample_size]

### TODO: Tweak these parameters and see how the results change.
color_space = 'YCrCb' # Can be RGB, HSV, LUV, HLS, YUV, YCrCb
orient = 9  # HOG orientations
pix_per_cell = 8 # HOG pixels per cell
cell_per_block = 2 # HOG cells per block
hog_channel = 'ALL' # Can be 0, 1, 2, or "ALL"
spatial_size = (16, 16) # Spatial binning dimensions
hist_bins = 16    # Number of histogram bins
spatial_feat = True # Spatial features on or off
hist_feat = True # Histogram features on or off
hog_feat = True # HOG features on or off
y_start_stop = [400, None] # Min and max in y to search in slide_window()

# extract features from training images
car_features = extract_features(cars, color_space, spatial_size, hist_bins, orient, pix_per_cell, 
                        cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)
notcar_features = extract_features(notcars, color_space, spatial_size, hist_bins, orient, pix_per_cell, 
                        cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)

# Stack both classes into one feature matrix (one row per image)
X = np.vstack((car_features, notcar_features)).astype(np.float64)                        
# Fit a per-column scaler
# NOTE(review): the scaler is fitted on all samples before the train/test
# split below, so test-set statistics influence the scaling.
X_scaler = StandardScaler().fit(X)
# Apply the scaler to X
scaled_X = X_scaler.transform(X)
# Labels: 1 for car rows, 0 for non-car rows (same order as X)
y = np.hstack((np.ones(len(car_features)), np.zeros(len(notcar_features))))

rand_state = 42#np.random.randint(0, 100)
# Hold out 33% of the samples for testing
X_train, X_test, y_train, y_test = train_test_split(
    scaled_X, y, test_size=0.33, random_state=rand_state)
# Report the HOG settings and resulting feature length
print('Using:',orient,'orientations',pix_per_cell,
    'pixels per cell and', cell_per_block,'cells per block')
print('Feature vector length:', len(X_train[0]))
# Use a linear SVC 
svc = LinearSVC(C=0.01)
# Check the training time for the SVC
t=time.time()
svc.fit(X_train, y_train)
t2 = time.time()
print(round(t2-t, 2), 'Seconds to train SVC...')
# Check the score of the SVC
print('Test Accuracy of SVC = ', round(svc.score(X_test, y_test), 4))
# Check the prediction time for a single sample
# NOTE(review): the timer is restarted here but nothing in this cell reads it.
t=time.time()

#### 2 | Sliding Windows

In [None]:
# Sliding-window demo on one test image, using the module-level `svc`,
# `X_scaler` and feature settings.
image = mpimg.imread('./test_images/test6.jpg')
draw_image = np.copy(image)
# 24x24 windows with 50% overlap, restricted in y by y_start_stop
windows = slide_window(image, x_start_stop=[None, None], y_start_stop=y_start_stop, 
                    xy_window=(24, 24), xy_overlap=(0.5, 0.5))
# Keep only the windows the classifier predicts as 1
hot_windows = search_windows(image, windows, svc, X_scaler, color_space=color_space, 
                        spatial_size=spatial_size, hist_bins=hist_bins, 
                        orient=orient, pix_per_cell=pix_per_cell, 
                        cell_per_block=cell_per_block, 
                        hog_channel=hog_channel, spatial_feat=spatial_feat, 
                        hist_feat=hist_feat, hog_feat=hog_feat)                       

window_img = draw_boxes(draw_image, hot_windows, color=(0, 0, 255), thick=3)                    

plt.imshow(window_img)

In [None]:
# HOG sub-sampling demo: run find_cars on one test image at a single scale
# and draw every returned box.
image = mpimg.imread('./test_images/test6.jpg')
# Rows delimiting the band that is searched
ystart = 400
ystop = 656
scale = 2.0
bbox_list = find_cars(image, ystart, ystop, scale, svc, X_scaler, orient, pix_per_cell,
                      cell_per_block, spatial_size, hist_bins)
draw_img = np.copy(image)
for box in bbox_list:
    # Each box holds its two corner points
    pt1 = box[0]
    pt2 = box[1]
    cv2.rectangle(draw_img, pt1, pt2, (0,0,255),3) 
plt.imshow(draw_img)

### Pipeline

#### 1 | Train SVC

In [None]:
from sklearn.svm import LinearSVC

def train_SVC(color_space='YCrCb', # Can be RGB, HSV, LUV, HLS, YUV, YCrCb
              orient=9,  # HOG orientations
              pix_per_cell=8, # HOG pixels per cell
              cell_per_block=2, # HOG cells per block
              hog_channel='ALL', # Can be 0, 1, 2, or "ALL"
              spatial_size=(16, 16), # Spatial binning dimensions
              hist_bins=16,    # Number of histogram bins
              spatial_feat=True, # Spatial features on or off
              hist_feat=True, # Histogram features on or off
              hog_feat=True, # HOG features on or off
              y_start_stop=[400, None], # Min and max in y to search in slide_window()
              cost=0.1 # Penalty parameter for error term of LinearSVC()
             ):
    """Train a LinearSVC car / non-car classifier on the PNG training sets.

    Car images are globbed from ``./vehicles/KITTI_extracted/*.png`` and
    non-car images from ``./non-vehicles/Extras/*.png``; features come from
    ``extract_features`` with the given settings.

    Args:
        color_space, orient, pix_per_cell, cell_per_block, hog_channel,
        spatial_size, hist_bins, spatial_feat, hist_feat, hog_feat:
            forwarded to ``extract_features``.
        y_start_stop: accepted for compatibility; not used by this function.
        cost: ``C`` parameter of ``LinearSVC``.

    Returns:
        ``(svc, X_scaler)``: the fitted classifier and the fitted
        ``StandardScaler``.

    Raises:
        ValueError: if either image set is empty.
    """
    notcars = glob.glob('./non-vehicles/Extras/*.png')
    cars = glob.glob('./vehicles/KITTI_extracted/*.png')
    print("# of car images:{}".format(len(cars)))
    print("# of non-car images:{}".format(len(notcars)))
    if not cars or not notcars:
        raise ValueError(
            "No training images found: {} car and {} non-car files "
            "matched".format(len(cars), len(notcars)))

    # extract features from training images
    car_features = extract_features(cars, color_space, spatial_size, hist_bins, orient, pix_per_cell,
                                    cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)
    notcar_features = extract_features(notcars, color_space, spatial_size, hist_bins, orient, pix_per_cell,
                                       cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)

    # One row per image; label 1 for cars, 0 for non-cars
    X = np.vstack((car_features, notcar_features)).astype(np.float64)
    y = np.hstack((np.ones(len(car_features)), np.zeros(len(notcar_features))))

    # Split first, then fit the scaler on the training rows only, so the
    # held-out rows do not leak into the scaling statistics.
    rand_state = 42
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.33, random_state=rand_state)
    X_scaler = StandardScaler().fit(X_train)
    X_train = X_scaler.transform(X_train)
    X_test = X_scaler.transform(X_test)

    print('Using:',orient,'orientations',pix_per_cell,
        'pixels per cell and', cell_per_block,'cells per block')
    print('Feature vector length:', len(X_train[0]))

    # Use a linear SVC and report how long fitting takes
    svc = LinearSVC(C=cost)
    t = time.time()
    svc.fit(X_train, y_train)
    t2 = time.time()
    print(round(t2-t, 2), 'Seconds to train SVC...')
    # Check the score of the SVC
    print('Test Accuracy of SVC = ', round(svc.score(X_test, y_test), 4))
    return svc, X_scaler

#### 2 | Find Cars Using HOG Sub-sampling Window Search

In [None]:
def find_cars_multi_scale(image, svc, X_scaler, orient, pix_per_cell, cell_per_block, spatial_size, hist_bins,
                          scale_list=[0.75, 1.5, 2.0, 2.25, 2.5, 3.0], color_conv='YCrCb'):
    """Run ``find_cars`` once per scale and pool all detections.

    The searched row band depends on the scale: 420-600 for scales up to
    1.5, 500-650 for scales up to 2.5, and 550-675 above that.

    Returns:
        A single list with the boxes from every scale, in scale order.
    """
    def _row_band(sc):
        # Row range searched for a given scale
        if sc <= 1.5:
            return 420, 600
        if sc <= 2.5:
            return 500, 650
        return 550, 675

    detections = []
    for sc in scale_list:
        band_top, band_bottom = _row_band(sc)
        detections.extend(
            find_cars(image, band_top, band_bottom, sc, svc, X_scaler,
                      orient, pix_per_cell, cell_per_block, spatial_size,
                      hist_bins, color_conv=color_conv))
    return detections

#### 3 | Heat Map, Threshold, Labeling and Drawing

In [None]:
def add_heat(heatmap, bbox_list):
    """Add 1 to ``heatmap`` inside every box and return the same array.

    Boxes are ``((x1, y1), (x2, y2))``; the heatmap is indexed ``[y, x]``
    and is modified in place.
    """
    for box in bbox_list:
        first_corner, second_corner = box[0], box[1]
        rows = slice(first_corner[1], second_corner[1])
        cols = slice(first_corner[0], second_corner[0])
        heatmap[rows, cols] += 1
    return heatmap

def apply_threshold(heatmap, threshold=2):
    """Zero every heatmap entry that is ``<= threshold`` (in place).

    Returns the same array object that was passed in.
    """
    too_cold = heatmap <= threshold
    heatmap[too_cold] = 0
    return heatmap

# Import from the public scipy.ndimage namespace; the
# scipy.ndimage.measurements module path is deprecated.
from scipy.ndimage import label
def apply_label(heatmap):
    """Label the connected non-zero regions of ``heatmap``.

    Returns:
        The ``(labeled_array, num_features)`` pair produced by
        ``scipy.ndimage.label``.
    """
    return label(heatmap)

def draw_labeled_bboxes(img, labels):
    """Draw one bounding box per labelled region on a copy of ``img``.

    Args:
        img: image array; it is copied, the input is not modified.
        labels: ``(labeled_array, count)`` pair as returned by
            ``apply_label``; regions are numbered 1..count.

    Returns:
        Copy of ``img`` with a rectangle around the extent of each region.
    """
    draw_img = np.copy(img)
    for car_number in range(1, labels[1] + 1):
        # Row (y) and column (x) indices of the pixels with this label
        nonzeroy, nonzerox = (labels[0] == car_number).nonzero()
        # Cast to built-in int: NumPy integer scalars are not accepted as
        # point coordinates by every OpenCV build.
        top_left = (int(nonzerox.min()), int(nonzeroy.min()))
        bottom_right = (int(nonzerox.max()), int(nonzeroy.max()))
        cv2.rectangle(draw_img, top_left, bottom_right, (0, 0, 255), 6)
    return draw_img

### Running the Pipeline

In [None]:
# Settings for the video pipeline; these module-level names are read by
# vehicle_detection_pipeline below.
color_space = 'HLS' # Can be RGB, HSV, LUV, HLS, YUV, YCrCb
orient = 9  # HOG orientations
pix_per_cell = 8 # HOG pixels per cell
cell_per_block = 2 # HOG cells per block
hog_channel = 'ALL' # Can be 0, 1, 2, or "ALL"
spatial_size = (16, 16) # Spatial binning dimensions
hist_bins = 16    # Number of histogram bins
spatial_feat = True # Spatial features on or off
hist_feat = True # Histogram features on or off
hog_feat = True # HOG features on or off
# Only cost and color_space are passed to train_SVC; the other settings
# above are not forwarded and happen to equal train_SVC's own defaults.
svc, X_scaler = train_SVC(cost=0.1, color_space=color_space)
def vehicle_detection_pipeline(img):
    """Process one video frame and return it with every raw detection drawn.

    Uses the module-level classifier and feature settings, and updates the
    module-level ``heatmap`` with the detections of this frame.
    """
    global heatmap
    scales = [1.0, 1.5, 2.0]#, 3.0, 3.75]
    detections = find_cars_multi_scale(
        img, svc, X_scaler, orient, pix_per_cell, cell_per_block,
        spatial_size, hist_bins, scales, color_conv=color_space)

    # Frame copy annotated with every raw detection box
    annotated = np.copy(img)
    for detection in detections:
        cv2.rectangle(annotated, detection[0], detection[1], (0,0,255), 3)

    # NOTE(review): the heatmap is never reset between frames, so entries
    # above the threshold keep accumulating -- confirm this is intended.
    heatmap = add_heat(heatmap, detections)
    heatmap = apply_threshold(heatmap, threshold=2)
    labels = apply_label(heatmap)
    # NOTE(review): the labelled-box image is computed but the raw-detection
    # image is what gets returned -- confirm which one is wanted.
    output_img = draw_labeled_bboxes(img, labels)
    return annotated
    
    

In [None]:
from moviepy.editor import VideoFileClip
from IPython.display import HTML
#
heatmap = np.zeros((1280, 720), dtype=np.int16)
input_clip = './project_video.mp4'
clip = VideoFileClip(input_clip).subclip(5,45)
output_clip = './project_video_output.mp4'
output = clip.fl_image(vehicle_detection_pipeline)
%time output.write_videofile(output_clip, audio=False)

In [None]:
# Embed the video file named by `output_clip` in the notebook output.
HTML("""
<video width="960" height="540" controls>
<source src="{0}"> </video>
""".format(output_clip))

## New Code

In [None]:
def get_hog_features(img, orient, pix_per_cell, cell_per_block,
                     vis=False, feature_vec=True):
    """Run skimage's ``hog`` on ``img`` with square cells and square blocks.

    Args:
        img: image handed straight to ``hog`` (the HOG-only code in this
            notebook passes a grayscale image).
        orient: number of orientation bins.
        pix_per_cell: cell edge length in pixels (used for both axes).
        cell_per_block: block edge length in cells (used for both axes).
        vis: forwarded to ``hog``; when True the result is the
            ``(features, hog_image)`` pair instead of the features alone.
        feature_vec: forwarded to ``hog`` as ``feature_vector``.

    Returns:
        Whatever ``hog`` returns for the given ``vis`` flag.
    """
    # NOTE(review): the keyword is spelled ``visualise`` here; newer
    # scikit-image releases spell it ``visualize`` -- confirm against the
    # installed version.
    hog_kwargs = dict(
        orientations=orient,
        pixels_per_cell=(pix_per_cell, pix_per_cell),
        cells_per_block=(cell_per_block, cell_per_block),
        transform_sqrt=True,
        visualise=vis,
        feature_vector=feature_vec,
    )
    return hog(img, **hog_kwargs)

def extract_HOG_features(img, orient=9, pix_per_cell=8, cell_per_block=2):
    """Return the flattened HOG feature vector of ``img``.

    The image is copied before being passed to ``get_hog_features``.
    """
    descriptor = get_hog_features(np.copy(img), orient, pix_per_cell,
                                  cell_per_block, vis=False, feature_vec=True)
    return np.ravel(descriptor)


def find_cars_HOG(img, ystart, ystop, scale, svc, X_scaler, orient, pix_per_cell, cell_per_block, cells_per_step=2):
    """Detect cars in a band of a single-channel image using HOG only.

    HOG is computed once for the whole (rescaled) band; each 64x64 search
    window reuses the matching slice of that HOG array as its features.

    Args:
        img: single-channel image indexed ``[y, x]``.
        ystart, ystop: rows delimiting the band to search.
        scale: the band is shrunk by this factor before searching, so a
            64-pixel window covers ``64 * scale`` original pixels.
        svc: classifier exposing ``predict``.
        X_scaler: fitted scaler exposing ``transform``.
        orient, pix_per_cell, cell_per_block: HOG parameters.
        cells_per_step: window stride, in HOG cells.

    Returns:
        List of ``[(x1, y1), (x2, y2)]`` boxes, in original image
        coordinates, for every window predicted as 1.
    """
    img = img.astype(np.float32) / 255
    ctrans_tosearch = img[ystart:ystop, :]
    bbox_list = []

    if scale != 1:
        imshape = ctrans_tosearch.shape
        ctrans_tosearch = cv2.resize(
            ctrans_tosearch,
            (int(imshape[1] / scale), int(imshape[0] / scale)))

    ch1 = ctrans_tosearch

    # Number of HOG blocks along each axis of the band
    nxblocks = (ch1.shape[1] // pix_per_cell) - cell_per_block + 1
    nyblocks = (ch1.shape[0] // pix_per_cell) - cell_per_block + 1

    # 64 was the original sampling rate, with 8 cells and 8 pix per cell
    window = 64
    nblocks_per_window = (window // pix_per_cell) - cell_per_block + 1
    # "+ 1" counts the starting position itself; without it the last window
    # (flush with the right/bottom edge) was never evaluated. A band smaller
    # than one window still yields a non-positive count, i.e. no iterations.
    nxsteps = (nxblocks - nblocks_per_window) // cells_per_step + 1
    nysteps = (nyblocks - nblocks_per_window) // cells_per_step + 1

    # Compute HOG features once for the entire band
    hog1 = get_hog_features(ch1, orient, pix_per_cell, cell_per_block, feature_vec=False)

    for xb in range(nxsteps):
        for yb in range(nysteps):
            ypos = yb * cells_per_step
            xpos = xb * cells_per_step
            # Extract HOG for this patch
            hog_features = hog1[ypos:ypos+nblocks_per_window, xpos:xpos+nblocks_per_window].ravel()

            xleft = xpos * pix_per_cell
            ytop = ypos * pix_per_cell

            # The scaler expects a 2-D array holding a single sample;
            # passing the 1-D vector directly is rejected by scikit-learn.
            test_features = X_scaler.transform(hog_features.reshape(1, -1))
            test_prediction = svc.predict(test_features)

            if test_prediction == 1:
                # Map the window back to original-image coordinates
                xbox_left = int(xleft * scale)
                ytop_draw = int(ytop * scale)
                win_draw = int(window * scale)
                bbox_list.append([(xbox_left, ytop_draw + ystart),
                                  (xbox_left + win_draw, ytop_draw + win_draw + ystart)])
    return bbox_list


In [None]:
from sklearn.svm import LinearSVC

def train_SVC_HOG(orient=9,  # HOG orientations
                  pix_per_cell=8, # HOG pixels per cell
                  cell_per_block=2, # HOG cells per block
                  cost=0.1 # Penalty parameter for error term of LinearSVC()
                 ):
    """Train a LinearSVC car / non-car classifier on grayscale HOG features.

    Car images are globbed from ``./vehicles/KITTI_extracted/*.png`` and
    non-car images from ``./non-vehicles/Extras/*.png``; each is read as
    grayscale with ``cv2.imread`` and described by ``extract_HOG_features``.

    Args:
        orient, pix_per_cell, cell_per_block: HOG parameters.
        cost: ``C`` parameter of ``LinearSVC``.

    Returns:
        ``(svc, X_scaler)``: the fitted classifier and the fitted
        ``StandardScaler``.

    Raises:
        ValueError: if either image set is empty or an image cannot be read.
    """
    def _hog_features_for(paths):
        # HOG feature vector of every readable image in `paths`
        collected = []
        for fname in paths:
            img = cv2.imread(fname, cv2.IMREAD_GRAYSCALE)
            if img is None:
                # cv2.imread signals failure with None instead of raising
                raise ValueError("Could not read training image: {}".format(fname))
            collected.append(extract_HOG_features(img, orient, pix_per_cell, cell_per_block))
        return collected

    notcars = glob.glob('./non-vehicles/Extras/*.png')
    cars = glob.glob('./vehicles/KITTI_extracted/*.png')
    print("# of car images:{}".format(len(cars)))
    print("# of non-car images:{}".format(len(notcars)))
    if not cars or not notcars:
        raise ValueError(
            "No training images found: {} car and {} non-car files "
            "matched".format(len(cars), len(notcars)))

    # extract features from training images
    car_features = _hog_features_for(cars)
    notcar_features = _hog_features_for(notcars)

    # One row per image; label 1 for cars, 0 for non-cars
    X = np.vstack((car_features, notcar_features)).astype(np.float64)
    y = np.hstack((np.ones(len(car_features)), np.zeros(len(notcar_features))))

    # Split first, then fit the scaler on the training rows only, so the
    # held-out rows do not leak into the scaling statistics.
    rand_state = 42
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.33, random_state=rand_state)
    X_scaler = StandardScaler().fit(X_train)
    X_train = X_scaler.transform(X_train)
    X_test = X_scaler.transform(X_test)

    print('Using:',orient,'orientations',pix_per_cell, 'pixels per cell and', cell_per_block,'cells per block')
    print('Feature vector length:', len(X_train[0]))

    # Use a linear SVC and report how long fitting takes
    svc = LinearSVC(C=cost)
    t = time.time()
    svc.fit(X_train, y_train)
    t2 = time.time()
    print(round(t2-t, 2), 'Seconds to train SVC...')
    # Check the score of the SVC
    print('Test Accuracy of SVC = ', round(svc.score(X_test, y_test), 4))
    return svc, X_scaler

In [None]:
# HOG-only experiment: train with 4-pixel cells. These module-level names
# are read by the HOG video pipeline defined in a later cell.
orient = 9  # HOG orientations
pix_per_cell = 4 # HOG pixels per cell
cell_per_block = 2 # HOG cells per block
svc, X_scaler = train_SVC_HOG(cost=0.1,
                              orient=orient,  # HOG orientations
                              pix_per_cell=pix_per_cell, # HOG pixels per cell
                              cell_per_block=cell_per_block)

In [None]:
# Row band and scale used by the HOG-only video pipeline
ystart, ystop = 380, 720
scale = 1.75
def vehicle_detection_pipeline_HOG(img):
    """Process one RGB frame with the HOG-only detector.

    The frame is converted to grayscale, searched with ``find_cars_HOG``
    using the module-level settings, and returned as a copy with every
    detection box drawn.
    """
    gray_frame = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    detections = find_cars_HOG(gray_frame, ystart, ystop, scale, svc, X_scaler,
                               orient, pix_per_cell, cell_per_block,
                               cells_per_step=2)
    annotated = np.copy(img)
    for detection in detections:
        cv2.rectangle(annotated, detection[0], detection[1], (0,0,255), 3)
    return annotated

In [None]:
from moviepy.editor import VideoFileClip
from IPython.display import HTML
# Run the HOG-only pipeline over an excerpt of the project video and write
# the annotated result to a temporary file.
input_clip = './project_video.mp4'
# subclip(5,10): presumably seconds 5-10 of the input (moviepy time arguments)
clip = VideoFileClip(input_clip).subclip(5,10)
output_clip = './project_video_temp.mp4'
# fl_image applies the pipeline function to each frame of the clip
output = clip.fl_image(vehicle_detection_pipeline_HOG)
# IPython magic: reports how long rendering takes (notebook-only syntax)
%time output.write_videofile(output_clip, audio=False)

In [None]:
# Embed the video written to `output_clip` as an inline HTML5 player.
HTML("""
<video width="960" height="540" controls>
<source src="{0}"> </video>
""".format(output_clip))

In [None]:
# Visualise the HOG descriptor of the searched band of a test image.
orient = 9  # HOG orientations
pix_per_cell = 8 # HOG pixels per cell
cell_per_block = 2 # HOG cells per block
#
# Flag 0 makes cv2.imread load the file as a single-channel grayscale image.
image = cv2.imread('./test_images/test1.jpg', 0)
# Keep only the rows between the module-level ystart/ystop.
image = image[ystart:ystop,:]
# vis=True additionally returns the rendered HOG image used for plotting.
ft, hog_image = get_hog_features(image, orient, pix_per_cell, cell_per_block, vis=True, feature_vec=True)
# feature_vec=False keeps the un-flattened block grid so its shape can be inspected.
ft2 = get_hog_features(image, orient, pix_per_cell, cell_per_block, feature_vec=False)
print("feature vec shape: {}".format(ft2.shape))
ft2 = np.ravel(ft2)
print("feature vec shape raveled: {}".format(ft2.shape))
#
from skimage import data, color, exposure
k=6
fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(k*8, k*4), sharex=True, sharey=True)

ax1.axis('off')
ax1.imshow(image, cmap=plt.cm.gray)
ax1.set_title('Input image')
ax1.set_adjustable('box-forced')

# Rescale histogram for better display
#hog_image_rescaled = exposure.rescale_intensity(hog_image, in_range=(0.25, 1.))

ax2.axis('off')
ax2.imshow(hog_image, cmap=plt.cm.gray)
ax2.set_title('Histogram of Oriented Gradients')
# Configure the second axes (the original repeated the call on ax1).
ax2.set_adjustable('box-forced')
plt.show()

# Step-by-step walkthrough of the sliding-window arithmetic on the cropped
# grayscale image: print every intermediate quantity for one window position.
ch1 = image
ctrans_tosearch = ch1
print("pix_per_cell: {}".format(pix_per_cell))
print("cell_per_block: {}".format(cell_per_block))
# Number of HOG block positions along x and y for the whole search region
nxblocks = (ch1.shape[1] // pix_per_cell) - cell_per_block + 1
nyblocks = (ch1.shape[0] // pix_per_cell) - cell_per_block + 1 
nfeat_per_block = orient*cell_per_block**2
print("nxblocks: {}".format(nxblocks))
print("nyblocks: {}".format(nyblocks))
print("nfeat_per_block: {}".format(nfeat_per_block))

# 64 was the original sampling rate, with 8 cells and 8 pix per cell
cells_per_step=2
window = 64
# Block positions covered by one window, and window steps across the region
nblocks_per_window = (window // pix_per_cell) - cell_per_block + 1
nxsteps = (nxblocks - nblocks_per_window) // cells_per_step
nysteps = (nyblocks - nblocks_per_window) // cells_per_step
print("nblocks_per_window: {}".format(nblocks_per_window))
print("nxsteps: {}".format(nxsteps))
print("nysteps: {}".format(nysteps))

# Compute individual channel HOG features for the entire image
hog1 = get_hog_features(ch1, orient, pix_per_cell, cell_per_block, feature_vec=False)
print("hog1 vec shape: {}".format(hog1.shape))

# Inspect a single window: step index (1, 1) converted to cell offsets
yb, xb = 1, 1
ypos = yb*cells_per_step
xpos = xb*cells_per_step
# Extract HOG for this patch
print("ypos: {}".format(ypos))
print("xpos: {}".format(xpos))
hog_feat1 = hog1[ypos:ypos+nblocks_per_window, xpos:xpos+nblocks_per_window].ravel()
hog_features = np.hstack((hog_feat1))
print("hog_features vec shape: {}".format(hog_features.shape))

# Pixel coordinates of the window's top-left corner
xleft = xpos*pix_per_cell
ytop = ypos*pix_per_cell
print("xleft: {}".format(xleft))
print("ytop: {}".format(ytop))


# Extract the image patch
subimg = cv2.resize(ctrans_tosearch[ytop:ytop+window, xleft:xleft+window], (64,64))
plt.imshow(subimg, cmap='gray')
# HOG computed directly on the patch, printed for comparison with the
# sub-sampled feature shape above
sub_ft = get_hog_features(subimg, orient, pix_per_cell, cell_per_block, feature_vec=False)
print("sub_ft feature_vec: {}".format(sub_ft.shape))
sub_ft = sub_ft.ravel()
print("sub_ft feature_vec raveled: {}".format(sub_ft.shape))
# Scale features and make a prediction (disabled in this walkthrough)
#test_features = X_scaler.transform(np.hstack((hog_features)).reshape(1, -1))     
#test_prediction = svc.predict(test_features)

#if test_prediction == 1:
#    xbox_left = np.int(xleft*scale)
#    ytop_draw = np.int(ytop*scale)
#    win_draw = np.int(window*scale)
#    bbox_list.append([(xbox_left, ytop_draw+ystart), (xbox_left+win_draw,ytop_draw+win_draw+ystart)])


In [None]:
# Gather one vehicle folder and one non-vehicle folder (all files are PNGs).
extra_images = glob.glob('./non-vehicles/Extras/*.png')
car_images = glob.glob('./vehicles/KITTI_extracted/*.png')
cars = list(car_images)
notcars = list(extra_images)
print("# of car images:{}".format(len(cars)))
print("# of non-car images:{}".format(len(notcars)))
# Sanity check: extract HOG features from the first car image (loaded as
# grayscale) and report the shape of the result.
img = cv2.imread(cars[0], cv2.IMREAD_GRAYSCALE)
car_features = extract_HOG_features(img, orient, pix_per_cell, cell_per_block)
print("car features shape: {}".format(car_features.shape))


### Explore

#### Explore Color Channels

Original Image

In [None]:
# Load a test frame, keep rows ystart..ystop and convert OpenCV's BGR to RGB
# so matplotlib shows the expected colours.
ystart, ystop = 380, 720
image = cv2.cvtColor(cv2.imread('./test_images/test1.jpg')[ystart:ystop, :],
                     cv2.COLOR_BGR2RGB)
#
k = 6
fig, ax1 = plt.subplots(1, 1, figsize=(8 * k, 4 * k), sharex=True, sharey=True)
ax1.axis('off')
ax1.imshow(image)
ax1.set_title('Original Image', fontsize=60)
ax1.set_adjustable('box-forced')
plt.show()

### HSV

In [None]:
# Show the three HSV channels of the cropped test image, one per row.
image_HSV = cv2.cvtColor(image, cv2.COLOR_RGB2HSV)
k = 6
fig, (ax1, ax2, ax3) = plt.subplots(3, 1, figsize=(8 * k, 4 * k), sharex=True, sharey=True)
for channel, (axis, title) in enumerate(zip((ax1, ax2, ax3), ('H', 'S', 'V'))):
    axis.axis('off')
    axis.imshow(image_HSV[:, :, channel], cmap='gray')
    axis.set_title(title, fontsize=60)
    axis.set_adjustable('box-forced')
plt.show()

### HLS

In [None]:
# Show the three HLS channels of the cropped test image, one per row.
image_HLS = cv2.cvtColor(image, cv2.COLOR_RGB2HLS)
k = 6
fig, (ax1, ax2, ax3) = plt.subplots(3, 1, figsize=(k*8, k*4), sharex=True, sharey=True)
for channel, (axis, title) in enumerate(zip((ax1, ax2, ax3), ('H', 'L', 'S'))):
    axis.axis('off')
    # Plot the HLS conversion (the original plotted image_HSV by mistake).
    axis.imshow(image_HLS[:, :, channel], cmap='gray')
    axis.set_title(title, fontsize=60)
    axis.set_adjustable('box-forced')
plt.show()

### LUV

In [None]:
# Show the three LUV channels of the cropped test image, one per row.
image_LUV = cv2.cvtColor(image, cv2.COLOR_RGB2LUV)
k = 6
fig, (ax1, ax2, ax3) = plt.subplots(3, 1, figsize=(k*8, k*4), sharex=True, sharey=True)
for channel, (axis, title) in enumerate(zip((ax1, ax2, ax3), ('L', 'U', 'V'))):
    axis.axis('off')
    # Plot the LUV conversion (the original plotted image_HSV by mistake).
    axis.imshow(image_LUV[:, :, channel], cmap='gray')
    axis.set_title(title, fontsize=60)
    axis.set_adjustable('box-forced')
plt.show()

### YUV

In [None]:
# Show the three YUV channels of the cropped test image, one per row.
image_YUV = cv2.cvtColor(image, cv2.COLOR_RGB2YUV)
k = 6
fig, (ax1, ax2, ax3) = plt.subplots(3, 1, figsize=(k*8, k*4), sharex=True, sharey=True)
for channel, (axis, title) in enumerate(zip((ax1, ax2, ax3), ('Y', 'U', 'V'))):
    axis.axis('off')
    # Plot the YUV conversion (the original plotted image_HSV by mistake).
    axis.imshow(image_YUV[:, :, channel], cmap='gray')
    axis.set_title(title, fontsize=60)
    axis.set_adjustable('box-forced')
plt.show()

### YCrCb

In [None]:
# Show the three YCrCb channels of the cropped test image, one per row.
image_YCrCb = cv2.cvtColor(image, cv2.COLOR_RGB2YCrCb)
k = 6
fig, (ax1, ax2, ax3) = plt.subplots(3, 1, figsize=(k*8, k*4), sharex=True, sharey=True)
for channel, (axis, title) in enumerate(zip((ax1, ax2, ax3), ('Y', 'Cr', 'Cb'))):
    axis.axis('off')
    # Plot the YCrCb conversion (the original plotted image_HSV by mistake).
    axis.imshow(image_YCrCb[:, :, channel], cmap='gray')
    axis.set_title(title, fontsize=60)
    axis.set_adjustable('box-forced')
plt.show()

### Train SVC

In [None]:
def convert_color(img, conv='RGB2YCrCb'):
    """Convert ``img`` to the colour space named by ``conv``.

    Args:
        img: image array. It is treated as RGB for every name except
            ``'BGR2YCrCb'``, which treats it as BGR.
        conv: one of ``'RGB'`` (no conversion), ``'YCrCb'``, ``'RGB2YCrCb'``
            (alias of ``'YCrCb'``), ``'BGR2YCrCb'``, ``'LUV'``, ``'YUV'``,
            ``'HSV'`` or ``'HLS'``.

    Returns:
        The converted image, or ``img`` itself (not a copy) for ``'RGB'``.

    Raises:
        ValueError: if ``conv`` is not a supported name. Previously the
            function fell through and returned ``None``, which also happened
            for its own default value ``'RGB2YCrCb'``.
    """
    if conv == 'RGB':
        return img
    # Names of the cv2 conversion constants, resolved only when needed.
    conversion_names = {
        'YCrCb': 'COLOR_RGB2YCrCb',
        'RGB2YCrCb': 'COLOR_RGB2YCrCb',
        'BGR2YCrCb': 'COLOR_BGR2YCrCb',
        'LUV': 'COLOR_RGB2LUV',
        'YUV': 'COLOR_RGB2YUV',
        'HSV': 'COLOR_RGB2HSV',
        'HLS': 'COLOR_RGB2HLS',
    }
    if conv not in conversion_names:
        raise ValueError("Unsupported color conversion: {!r}".format(conv))
    return cv2.cvtColor(img, getattr(cv2, conversion_names[conv]))

def get_hog_features(img, orient, pix_per_cell, cell_per_block,
                     vis=False, feature_vec=True):
    """Compute HOG features for a single-channel image.

    Thin wrapper around ``skimage.feature.hog`` that uses square cells and
    square blocks and always enables ``transform_sqrt``.

    Args:
        img: 2-D image (one channel).
        orient: number of orientation bins.
        pix_per_cell: cell side length in pixels.
        cell_per_block: block side length in cells.
        vis: when true, ``hog`` also returns a rendering of the descriptor.
        feature_vec: forwarded as ``feature_vector``.

    Returns:
        ``features`` alone, or ``(features, hog_image)`` when ``vis`` is set.
    """
    # hog() already returns a pair exactly when visualisation is requested,
    # so a single call covers both cases.
    # NOTE(review): newer scikit-image releases spell this keyword
    # `visualize`; confirm against the installed version.
    return hog(img,
               orientations=orient,
               pixels_per_cell=(pix_per_cell, pix_per_cell),
               cells_per_block=(cell_per_block, cell_per_block),
               transform_sqrt=True,
               visualise=vis,
               feature_vector=feature_vec)

# Spatially binned colour features
def bin_spatial(img, size=(32, 32)):
    """Resize ``img`` to ``size`` and return its pixels as a flat 1-D vector."""
    resized = cv2.resize(img, size)
    return resized.ravel()

# Colour histogram features
# NEED TO CHANGE bins_range if reading .png files with mpimg!
def color_hist(img, nbins=32, bins_range=(0, 256)):
    """Return the per-channel histograms of ``img`` as one feature vector.

    Args:
        img: array indexed as ``img[:, :, channel]``; channels 0, 1 and 2
            are used.
        nbins: number of histogram bins per channel.
        bins_range: ``(low, high)`` value range covered by the bins.

    Returns:
        1-D array of length ``3 * nbins``: the bin counts of channel 0,
        then channel 1, then channel 2.
    """
    per_channel_counts = [
        np.histogram(img[:, :, channel], bins=nbins, range=bins_range)[0]
        for channel in (0, 1, 2)
    ]
    return np.concatenate(per_channel_counts)

# Define a function to extract features from a list of images
# Have this function call bin_spatial() and color_hist()
def extract_features(imgs, color_channels=None,
                     spatial_size=(32, 32),
                     hist_bins=32, orient=9,
                     pix_per_cell=8, cell_per_block=2, hog_channel=0,
                     spatial_feat=True, hist_feat=True, hog_feat=True):
    """Build one combined feature vector per image file.

    Each file is read with ``cv2.imread`` (BGR channel order), converted to
    the requested colour space, and described by the enabled feature groups,
    concatenated in this order: spatial bins, colour histogram, HOG.

    Args:
        imgs: iterable of image file paths.
        color_channels: name of the target colour space: ``'RGB'``,
            ``'HSV'``, ``'LUV'``, ``'HLS'``, ``'YUV'`` or ``'YCrCb'``. The
            parameter keeps its historical name. Any non-string value
            (including the default ``None``) selects ``'RGB'``.
        spatial_size: target size passed to ``bin_spatial``.
        hist_bins: number of bins passed to ``color_hist``.
        orient, pix_per_cell, cell_per_block: HOG settings.
        hog_channel: channel index used for HOG, or ``'ALL'``.
        spatial_feat, hist_feat, hog_feat: enable/disable each group.

    Returns:
        List with one 1-D feature array per input file.

    Raises:
        ValueError: if the colour space name is not supported.
        IOError: if a file cannot be read as an image.
    """
    # The original body ignored this parameter and read a global instead.
    color_space = color_channels if isinstance(color_channels, str) else 'RGB'
    # cv2.imread() returns BGR data, so every conversion must start from BGR;
    # using the RGB2* codes here would swap red and blue relative to the RGB
    # frames seen at prediction time. Names are resolved lazily via getattr.
    bgr_conversions = {
        'RGB': 'COLOR_BGR2RGB',
        'HSV': 'COLOR_BGR2HSV',
        'LUV': 'COLOR_BGR2LUV',
        'HLS': 'COLOR_BGR2HLS',
        'YUV': 'COLOR_BGR2YUV',
        'YCrCb': 'COLOR_BGR2YCrCb',
    }
    if color_space not in bgr_conversions:
        raise ValueError("Unsupported color space: {!r}".format(color_space))

    # Create a list to append feature vectors to
    features = []
    # Iterate through the list of images
    for file in imgs:
        file_features = []
        # Read in each one by one
        image = cv2.imread(file)
        if image is None:
            # cv2.imread signals failure by returning None instead of raising
            raise IOError("Could not read image file: {}".format(file))
        feature_image = cv2.cvtColor(image, getattr(cv2, bgr_conversions[color_space]))

        if spatial_feat:
            file_features.append(bin_spatial(feature_image, size=spatial_size))
        if hist_feat:
            file_features.append(color_hist(feature_image, nbins=hist_bins))
        if hog_feat:
            if hog_channel == 'ALL':
                # One HOG vector per channel, flattened into a single vector
                hog_features = np.ravel([
                    get_hog_features(feature_image[:, :, channel],
                                     orient, pix_per_cell, cell_per_block,
                                     vis=False, feature_vec=True)
                    for channel in range(feature_image.shape[2])
                ])
            else:
                hog_features = get_hog_features(feature_image[:, :, hog_channel], orient,
                                                pix_per_cell, cell_per_block,
                                                vis=False, feature_vec=True)
            file_features.append(hog_features)
        features.append(np.concatenate(file_features))
    # Return list of feature vectors
    return features

In [None]:
from sklearn.svm import LinearSVC

def train_SVC(color_space='YCrCb', # Can be RGB, HSV, LUV, HLS, YUV, YCrCb
              orient=9,  # HOG orientations
              pix_per_cell=8, # HOG pixels per cell
              cell_per_block=2, # HOG cells per block
              hog_channel='ALL', # Can be 0, 1, 2, or "ALL"
              spatial_size=(16, 16), # Spatial binning dimensions
              hist_bins=16,    # Number of histogram bins
              spatial_feat=True, # Spatial features on or off
              hist_feat=True, # Histogram features on or off
              hog_feat=True, # HOG features on or off
              cost=0.1 # Penalty parameter for error term of LinearSVC()
             ):
    """Train a linear SVM car / not-car classifier on the PNG datasets.

    Image paths are globbed from ``./vehicles/*`` and ``./non-vehicles/*``,
    features are extracted with ``extract_features``, the samples are split
    70/30 with a fixed random state, standardised, and a ``LinearSVC`` is
    fitted. Progress, training time and test accuracy are printed.

    Returns:
        ``(svc, X_scaler)``: the fitted classifier and the fitted
        ``StandardScaler`` that must be applied to features before
        prediction.

    Raises:
        ValueError: if either image class has no files on disk.
    """
    ### images are PNGs
    notcars = (glob.glob('./non-vehicles/Extras/*.png')
               + glob.glob('./non-vehicles/GTI/*.png'))
    cars = []
    for folder in ('KITTI_extracted', 'GTI_Right', 'GTI_MiddleClose',
                   'GTI_Far', 'GTI_Left'):
        cars.extend(glob.glob('./vehicles/{}/*.png'.format(folder)))
    print("# of car images:{}".format(len(cars)))
    print("# of non-car images:{}".format(len(notcars)))
    if not cars or not notcars:
        # Fail early with a clear message instead of an obscure error later
        raise ValueError("Training images not found under ./vehicles and ./non-vehicles")

    # extract features from training images
    car_features = extract_features(cars, color_space, spatial_size, hist_bins, orient, pix_per_cell,
                        cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)
    notcar_features = extract_features(notcars, color_space, spatial_size, hist_bins, orient, pix_per_cell,
                        cell_per_block, hog_channel, spatial_feat, hist_feat, hog_feat)
    #
    X = np.vstack((car_features, notcar_features)).astype(np.float64)
    # Label 1 = car, 0 = not car, in the same order as the rows of X
    y = np.hstack((np.ones(len(car_features)), np.zeros(len(notcar_features))))

    rand_state = 42
    # split
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.30, random_state=rand_state)
    # Fit the per-column scaler on the training rows only, so the held-out
    # rows do not influence the statistics and inflate the reported accuracy.
    X_scaler = StandardScaler().fit(X_train)
    X_train = X_scaler.transform(X_train)
    X_test = X_scaler.transform(X_test)
    #
    print('Using:',orient,'orientations',pix_per_cell,
        'pixels per cell and', cell_per_block,'cells per block')
    print('Feature vector length:', len(X_train[0]))
    # Use a linear SVC
    svc = LinearSVC(C=cost)
    # Check the training time for the SVC
    t = time.time()
    svc.fit(X_train, y_train)
    t2 = time.time()
    print(round(t2-t, 2), 'Seconds to train SVC...')
    # Check the score of the SVC
    print('Test Accuracy of SVC = ', round(svc.score(X_test, y_test), 4))
    return svc, X_scaler

In [None]:
# Define a single function that can extract features using hog sub-sampling and make predictions
def find_cars(img, search_box, scale,
              svc, X_scaler,
              orient, pix_per_cell, cell_per_block,
              spatial_size, hist_bins,
              cells_per_step=2, color_conv='YCrCb'):
    """Slide a 64x64 window over a region of ``img`` and collect car hits.

    HOG is computed once per channel for the whole (rescaled) region and
    sub-sampled per window; spatial and histogram features are computed on
    each window patch. The feature order (spatial, histogram, HOG) matches
    the way the vectors are assembled here for ``X_scaler``.

    Args:
        img: 3-channel frame; converted with ``convert_color`` unless
            ``color_conv`` is ``'RGB'``.
        search_box: ``[xstart, ystart, xstop, ystop]`` in frame pixels.
        scale: the region is shrunk by this factor, so each 64 px window
            covers ``64 * scale`` frame pixels.
        svc: classifier exposing ``predict``.
        X_scaler: scaler exposing ``transform``.
        orient, pix_per_cell, cell_per_block: HOG settings.
        spatial_size, hist_bins: colour feature settings.
        cells_per_step: window stride, in HOG cells.
        color_conv: colour space name passed to ``convert_color``.

    Returns:
        List of ``[(x1, y1), (x2, y2)]`` boxes in frame coordinates for
        every window predicted as class 1.
    """
    xstart, xstop = search_box[0], search_box[2]
    ystart, ystop = search_box[1], search_box[3]

    img_tosearch = img[ystart:ystop, xstart:xstop, :]
    bbox_list = []

    if color_conv != 'RGB':
        ctrans_tosearch = convert_color(img_tosearch, conv=color_conv)
    else:
        ctrans_tosearch = img_tosearch
    if scale != 1:
        imshape = ctrans_tosearch.shape
        # Builtin int replaces the np.int alias, which newer NumPy removed
        ctrans_tosearch = cv2.resize(
            ctrans_tosearch, (int(imshape[1] / scale), int(imshape[0] / scale)))

    ch1 = ctrans_tosearch[:, :, 0]
    ch2 = ctrans_tosearch[:, :, 1]
    ch3 = ctrans_tosearch[:, :, 2]

    # Define blocks and steps as above
    nxblocks = (ch1.shape[1] // pix_per_cell) - cell_per_block + 1
    nyblocks = (ch1.shape[0] // pix_per_cell) - cell_per_block + 1

    # 64 was the original sampling rate, with 8 cells and 8 pix per cell
    window = 64
    nblocks_per_window = (window // pix_per_cell) - cell_per_block + 1
    # "+ 1" counts window positions rather than gaps between them; without
    # it the last column and row of windows were never evaluated.
    nxsteps = (nxblocks - nblocks_per_window) // cells_per_step + 1
    nysteps = (nyblocks - nblocks_per_window) // cells_per_step + 1
    if nxsteps <= 0 or nysteps <= 0:
        # Region is smaller than one window: nothing to classify
        return bbox_list

    # Compute individual channel HOG features for the entire image
    hog1 = get_hog_features(ch1, orient, pix_per_cell, cell_per_block, feature_vec=False)
    hog2 = get_hog_features(ch2, orient, pix_per_cell, cell_per_block, feature_vec=False)
    hog3 = get_hog_features(ch3, orient, pix_per_cell, cell_per_block, feature_vec=False)

    for xb in range(nxsteps):
        for yb in range(nysteps):
            ypos = yb * cells_per_step
            xpos = xb * cells_per_step
            # Extract HOG for this patch
            hog_features = np.hstack([
                channel_hog[ypos:ypos + nblocks_per_window,
                            xpos:xpos + nblocks_per_window].ravel()
                for channel_hog in (hog1, hog2, hog3)
            ])

            xleft = xpos * pix_per_cell
            ytop = ypos * pix_per_cell

            # Extract the image patch
            subimg = cv2.resize(ctrans_tosearch[ytop:ytop + window, xleft:xleft + window], (64, 64))

            # Get color features
            spatial_features = bin_spatial(subimg, size=spatial_size)
            hist_features = color_hist(subimg, nbins=hist_bins)

            # Scale features and make a prediction
            test_features = X_scaler.transform(
                np.hstack((spatial_features, hist_features, hog_features)).reshape(1, -1))
            test_prediction = svc.predict(test_features)

            # predict() returns a one-element array for the single sample
            if test_prediction[0] == 1:
                # Map the window back to frame coordinates
                xbox_left = int(xleft * scale)
                ytop_draw = int(ytop * scale)
                win_draw = int(window * scale)
                bbox_list.append([(xbox_left + xstart, ytop_draw + ystart),
                                  (xbox_left + win_draw + xstart, ytop_draw + win_draw + ystart)])

    return bbox_list

In [None]:
def add_heat(img, bbox_list):
    """Build a heatmap counting how many boxes cover each pixel of ``img``.

    Args:
        img: frame whose first two dimensions (rows, columns) size the
            heatmap; only its shape is used.
        bbox_list: iterable of boxes of the form ``((x1, y1), (x2, y2))``.

    Returns:
        2-D ``int32`` array with one count per pixel.
    """
    # Size the map from the argument (the original read a global `image`)
    # and use a wide integer type so counts above 255 cannot wrap around.
    heatmap = np.zeros(img.shape[:2], dtype=np.int32)
    # Iterate through list of bboxes
    for box in bbox_list:
        (x1, y1), (x2, y2) = box[0], box[1]
        # Add += 1 for all pixels inside each bbox
        heatmap[y1:y2, x1:x2] += 1

    # Return updated heatmap
    return heatmap

def apply_threshold(heatmap, threshold=2):
    """Zero every heatmap entry that does not exceed ``threshold``.

    The array is modified in place and also returned.
    """
    too_cold = heatmap <= threshold
    heatmap[too_cold] = 0
    return heatmap

# `label` is imported from scipy.ndimage directly; the
# scipy.ndimage.measurements namespace is deprecated.
from scipy.ndimage import label
def get_labels(heatmap):
    """Label the connected non-zero regions of ``heatmap``.

    Returns:
        The result of ``scipy.ndimage.label``: a pair
        ``(labeled_array, num_features)``.
    """
    return label(heatmap)

def draw_labeled_bboxes(img, labels):
    """Outline each labelled region on a copy of ``img``.

    Args:
        img: image to annotate; it is copied, not modified.
        labels: pair ``(label_map, count)`` where region ``n`` consists of
            the entries of ``label_map`` equal to ``n`` (1..count).

    Returns:
        The annotated copy, with one rectangle per region spanning the
        minimum and maximum x / y of that region's pixels.
    """
    annotated = np.copy(img)
    label_map, car_count = labels[0], labels[1]
    for car_id in range(1, car_count + 1):
        # Row (y) and column (x) indices of the pixels belonging to this car
        hits = (label_map == car_id).nonzero()
        ys, xs = np.array(hits[0]), np.array(hits[1])
        top_left = (np.min(xs), np.min(ys))
        bottom_right = (np.max(xs), np.max(ys))
        cv2.rectangle(annotated, top_left, bottom_right, (0, 0, 255), 3)
    return annotated

In [None]:
# Single-image check of the detector. It needs get_search_window() and the
# trained svc / X_scaler / feature settings to exist already.
image = cv2.imread('./test_images/test3.jpg')
image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
# Converted copy kept for inspection only: find_cars() performs the
# color_space conversion itself, so it must be given the RGB image.
image_conv = convert_color(image, conv=color_space)
#
scales = [ 0.75]
bbox_list = []
cells_per_step = 1
for scale in scales:
    search_box = get_search_window(scale)
    # Pass the RGB image; passing image_conv would convert it twice.
    bbox_list.extend(find_cars(image, search_box, scale, svc, X_scaler,
                  orient, pix_per_cell, cell_per_block,
                  spatial_size, hist_bins,
                  cells_per_step, color_space))
print(len(bbox_list))
heatmap = add_heat(image, bbox_list)
heatmap = apply_threshold(heatmap, threshold=3)
labels = get_labels(heatmap)
detected_img = draw_labeled_bboxes(image, labels)
#
k=10
fig, (ax1, ax2, ax3) = plt.subplots(1, 3, figsize=(k*1.78, k), sharex=True, sharey=True)
ax1.axis('off')
ax1.imshow(image)
ax1.set_title('Original', fontsize=20)
ax1.set_adjustable('box-forced')
#
ax2.axis('off')
ax2.imshow(heatmap, cmap='gray')
ax2.set_title('Heatmap', fontsize=20)
ax2.set_adjustable('box-forced')
#
ax3.axis('off')
ax3.imshow(detected_img)
# Third panel shows the labelled boxes, not the heatmap
ax3.set_title('Detections', fontsize=20)
ax3.set_adjustable('box-forced')

#draw_img = np.copy(image)
#for box in bbox_list:
#    cv2.rectangle(draw_img, box[0], box[1], (0,0,255), 3)
#plt.imshow(draw_img)

## Pipeline

In [None]:
def get_search_window(scale):
    """Return the search region to use for a given window scale.

    Args:
        scale: window scale factor.

    Returns:
        A new list ``[xstart, ystart, xstop, ystop]``. Scales are bucketed
        by upper bound (0.5, 1.0, 1.5, 2.0, 2.5); anything larger gets the
        final fallback region.
    """
    # (largest scale served by the region, region)
    regions_by_max_scale = (
        (0.5, (500, 425, 1280, 450)),
        (1.0, (500, 400, 1280, 550)),
        (1.5, (500, 425, 1280, 575)),
        (2.0, (525, 500, 1280, 625)),
        (2.5, (525, 550, 1280, 720)),
    )
    for max_scale, region in regions_by_max_scale:
        if scale <= max_scale:
            return list(region)
    return [525, 450, 1280, 720]
    

In [None]:
# Classifier and feature settings. They stay at module level because the
# detection pipeline reads them as globals.
cost = 0.1  # Penalty parameter for the error term of LinearSVC()
color_space = 'YCrCb'  # Can be RGB, HSV, LUV, HLS, YUV, YCrCb

# HOG features
hog_feat = True
orient, pix_per_cell, cell_per_block = 9, 16, 2
hog_channel = 'ALL'  # Can be 0, 1, 2, or "ALL"

# Spatial binning features
spatial_feat = True
spatial_size = (16, 16)

# Colour histogram features
hist_feat = True
hist_bins = 32

print("Using {} color space.".format(color_space))
svc, X_scaler = train_SVC(
    color_space=color_space,
    orient=orient,
    pix_per_cell=pix_per_cell,
    cell_per_block=cell_per_block,
    hog_channel=hog_channel,
    spatial_size=spatial_size,
    hist_bins=hist_bins,
    spatial_feat=spatial_feat,
    hist_feat=hist_feat,
    hog_feat=hog_feat,
    cost=cost,
)


In [None]:
# Window scales searched per frame, window stride (in HOG cells) and the
# heatmap count a pixel must exceed to survive thresholding.
scales = [0.5, 1.0, 1.5, 2.0, 3.0]
cells_per_step = 2
heatmap_thresh = 2
#
def vehicle_detection_pipeline(img):
    """Detect vehicles in one frame and return an annotated copy.

    Steps: run ``find_cars`` at every scale in ``scales`` (each with its own
    search region), accumulate the hits into a heatmap, drop pixels at or
    below ``heatmap_thresh``, label the remaining regions and draw one box
    per region.

    Args:
        img: input frame; the original comment describes it as an RGB
            1280 x 720 image.

    Returns:
        Copy of ``img`` with the detected boxes drawn.
    """
    detections = []
    for window_scale in scales:
        detections += find_cars(img, get_search_window(window_scale), window_scale,
                                svc, X_scaler,
                                orient, pix_per_cell, cell_per_block,
                                spatial_size, hist_bins,
                                cells_per_step, color_space)
    # Heatmap of overlapping detections, with weak responses removed
    heat = apply_threshold(add_heat(img, detections), heatmap_thresh)
    # One bounding box per connected hot region
    return draw_labeled_bboxes(img, get_labels(heat))
#
from moviepy.editor import VideoFileClip
from IPython.display import HTML
# Run the full detection pipeline over an excerpt of the project video and
# write the annotated result next to the input.
input_clip = './project_video.mp4'
# subclip(5,25): presumably seconds 5-25 of the input (moviepy time arguments)
clip = VideoFileClip(input_clip).subclip(5,25)
output_clip = './project_video_output.mp4'
# fl_image applies the pipeline function to each frame of the clip
output = clip.fl_image(vehicle_detection_pipeline)
# IPython magic: reports how long rendering takes (notebook-only syntax)
%time output.write_videofile(output_clip, audio=False)

In [None]:
# Embed the video written to `output_clip` as an inline HTML5 player.
HTML("""
<video width="960" height="540" controls>
<source src="{0}"> </video>
""".format(output_clip))