## Advanced Lane Finding Project

The goals / steps of this project are the following:

* Compute the camera calibration matrix and distortion coefficients given a set of chessboard images.
* Apply a distortion correction to raw images.
* Use color transforms, gradients, etc., to create a thresholded binary image.
* Apply a perspective transform to rectify the binary image ("bird's-eye view").
* Detect lane pixels and fit to find the lane boundary.
* Determine the curvature of the lane and vehicle position with respect to center.
* Warp the detected lane boundaries back onto the original image.
* Output a visual display of the lane boundaries and a numerical estimate of lane curvature and vehicle position.

---
## First, I'll compute the camera calibration using chessboard images

In [1]:
import numpy as np
import cv2
import glob
import matplotlib.pyplot as plt
%matplotlib qt

# Reference grid of chessboard corners in board coordinates:
# (0,0,0), (1,0,0), ..., (8,5,0) -- one row per corner of the 9x6 grid,
# with the z column left at zero.
objp = np.zeros((6*9, 3), np.float32)
objp[:, :2] = np.mgrid[0:9, 0:6].T.reshape(-1, 2)

# Correspondences accumulated over every image in which the board is found.
objpoints = []  # 3d points in real world space
imgpoints = []  # 2d points in image plane

# Paths of the calibration images.
images = glob.glob('../camera_cal/calibration*.jpg')

for fname in images:
    img = cv2.imread(fname)
    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

    # Search this image for the 9x6 corner grid.
    ret, corners = cv2.findChessboardCorners(gray, (9, 6), None)
    if not ret:
        # No board detected: this image contributes no correspondences.
        continue

    objpoints.append(objp)
    imgpoints.append(corners)

    # Show the detected corners for half a second as a visual check.
    img = cv2.drawChessboardCorners(img, (9, 6), corners, ret)
    cv2.imshow('img', img)
    cv2.waitKey(500)

cv2.destroyAllWindows()

## And so on and so forth...

In [2]:
# Calibrate the camera from the collected chessboard correspondences.
# `gray` is whatever grayscale image was converted last; reversing its 2-D
# shape turns (rows, cols) into the (width, height) order passed here.
calib_image_size = gray.shape[::-1]
ret, mtx, dist, rvecs, tvecs = cv2.calibrateCamera(
    objpoints, imgpoints, calib_image_size, None, None
)

In [3]:
import os
# Paths of the road images that the undistortion step iterates over.
test_images = glob.glob('../test_images/*.jpg')

In [13]:
# Undistort every test image with the calibration result (`mtx`, `dist`) and
# save it as ../output_images/cal_img_<original file name>.
#
# The earlier `if ret:` guard was removed: `ret` is a single global value, not
# a per-file status, so it could never tell which image "has a problem".
# NOTE(review): per the OpenCV docs, calibrateCamera's first return value is
# the RMS re-projection error rather than a success flag -- confirm.
for fname in test_images:
    img = cv2.imread(fname)
    if img is None:
        # Unreadable or missing file: report it and move on instead of
        # failing inside the undistortion call.
        print(fname, 'could not be read')
        continue

    cal_img = cv2.undistort(img, mtx, dist, None, mtx)

    out_path = os.path.join('../output_images', 'cal_img_' + os.path.basename(fname))
    if not cv2.imwrite(out_path, cal_img):
        # A falsy return means nothing was written (e.g. missing directory).
        print(out_path, 'could not be written')

In [18]:
# Turn every undistorted image into a binary lane mask: a pixel is set (255)
# when its gradient magnitude OR its HLS saturation falls inside the
# corresponding threshold range. The result is written to
# ../output_images/mag_S_thresholded_*.jpg.
cal_images = glob.glob('../output_images/cal_img_straight*.jpg') + glob.glob('../output_images/cal_img_test*.jpg')

# The thresholds are identical for every image, so they are defined once.
mag_threshold = (60, 255)
R_threshold = (70, 255)
S_threshold = (100, 255)  # more flexible


def _scale_to_uint8(values):
    """Rescale non-negative ``values`` so that their maximum maps to 255."""
    peak = np.max(values)
    if peak == 0:
        # Flat input: nothing to scale, and dividing by zero would give NaNs.
        return np.zeros(values.shape, dtype=np.uint8)
    return np.uint8(255*values/peak)


for fname in cal_images:
    img = cv2.imread(fname)
    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

    # Gradient magnitude of the grayscale image (3x3 Sobel in x and y).
    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=3)
    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=3)
    mag_sobel = np.sqrt(sobelx**2 + sobely**2)
    scaled_sobel = _scale_to_uint8(mag_sobel)
    # Masks are uint8 (like `gray`) so they can be stacked and written
    # without an implicit float conversion.
    smag_bin_img = np.zeros_like(gray)
    smag_bin_img[(scaled_sobel >= mag_threshold[0]) & (scaled_sobel <= mag_threshold[1])] = 255

    # x-gradient of the R channel (index 2 of a BGR image). The Sobel input
    # was previously `gray`, which made this a duplicate of the x-gradient
    # above instead of a red-channel feature.
    # NOTE: R_bin_img is computed but not part of the combined mask below.
    R = img[:, :, 2]
    sobelx_R = cv2.Sobel(R, cv2.CV_64F, 1, 0, ksize=3)
    abs_sobel = np.absolute(sobelx_R)
    scaled_sobel = _scale_to_uint8(abs_sobel)
    R_bin_img = np.zeros_like(R)
    R_bin_img[(scaled_sobel >= R_threshold[0]) & (scaled_sobel <= R_threshold[1])] = 255

    # S channel of the HLS colour space, thresholded directly.
    hls = cv2.cvtColor(img, cv2.COLOR_BGR2HLS)
    S = hls[:, :, 2]
    S_bin_img = np.zeros_like(S)
    S_bin_img[(S >= S_threshold[0]) & (S <= S_threshold[1])] = 255

    # Three-channel view of the individual masks, kept for optional preview
    # with cv2.imshow; only the combined mask is saved.
    stacked_bin_img = np.dstack((smag_bin_img, S_bin_img, S_bin_img))
    combined_bin_img = np.zeros_like(gray)
    combined_bin_img[(smag_bin_img == 255) | (S_bin_img == 255)] = 255

    cv2.imwrite(os.path.join('../output_images', os.path.basename(fname).replace('cal_img', 'mag_S_thresholded')), combined_bin_img)

cv2.destroyAllWindows()

In [13]:
# Warp each thresholded image to a top-down view and preview the result.
bin_images = glob.glob('../output_images/mag_S_thresholded*.jpg')

# Source quadrilateral, listed top-left, top-right, bottom-right, bottom-left
# so that it pairs index-by-index with the destination rectangle built below.
label_img_coords = [[573, 467], [709, 467], [1007, 667], [293, 667]]  # order
# Margins in pixels between the destination rectangle and the image border.
offset_x = 300
offset_y = 0

for fname in bin_images:
    img = cv2.imread(fname)
    img_size = img.shape[1::-1]  # (width, height)

    # Destination rectangle: the image inset by the offsets on each side.
    right_x = img_size[0] - offset_x
    bottom_y = img_size[1] - offset_y
    topdown_coords = [[offset_x, offset_y], [right_x, offset_y],
                      [right_x, bottom_y], [offset_x, bottom_y]]

    src_pts = np.float32(label_img_coords)
    dst_pts = np.float32(topdown_coords)
    pt_mtx = cv2.getPerspectiveTransform(src_pts, dst_pts)

    warped_img = cv2.warpPerspective(img, pt_mtx, img_size, flags=cv2.INTER_NEAREST)

    # NOTE(review): saving is switched off here, yet a later cell globs
    # ../output_images/warped_bin*.jpg -- re-enable the line below when
    # those files need to be regenerated.
    #cv2.imwrite(os.path.join('../output_images', os.path.basename(fname).replace('mag_S_thresholded', 'warped_bin')), warped_img)
    cv2.imshow('warped_img', warped_img)
    cv2.waitKey(500)

cv2.destroyAllWindows()

In [49]:
# Two functions just copied from my exercise
def find_lane_pixels(binary_warped, nwindows=9, margin=100, minpix=50):
    """Collect left and right lane-line pixels with a sliding-window search.

    The column histogram of the bottom half of the image provides the
    starting x position of each line: the strongest column left of the
    middle and the strongest column from the middle rightwards. ``nwindows``
    windows are then stacked from the bottom row upwards. Whenever a window
    holds more than ``minpix`` nonzero pixels, the next window is re-centred
    on their mean x position.

    Args:
        binary_warped: 2-D array whose nonzero entries are candidate pixels.
        nwindows: number of windows stacked vertically.
        margin: half-width of each window in pixels.
        minpix: pixel count a window must exceed to re-centre the next one.

    Returns:
        Tuple ``(leftx, lefty, rightx, righty, out_img)``. The first four are
        1-D arrays with the x / y coordinates of the pixels assigned to the
        left and right line; ``out_img`` is ``binary_warped`` stacked three
        times along a new last axis, meant as a canvas for visualisation.

    Raises:
        ValueError: if ``nwindows`` is smaller than 1.
    """
    if nwindows < 1:
        raise ValueError('nwindows must be at least 1')

    height = binary_warped.shape[0]

    # Column sums over the bottom half of the image.
    histogram = np.sum(binary_warped[height // 2:, :], axis=0)
    # Three-channel canvas for the caller to draw on.
    out_img = np.dstack((binary_warped, binary_warped, binary_warped))

    # Starting columns: histogram peak on each side of the middle column.
    # Plain int() replaces the np.int alias, which newer NumPy no longer has.
    midpoint = int(histogram.shape[0] // 2)
    leftx_current = int(np.argmax(histogram[:midpoint]))
    rightx_current = int(np.argmax(histogram[midpoint:])) + midpoint

    # Rows left over when the height is not a multiple of nwindows sit at the
    # top of the image and are not searched.
    window_height = int(height // nwindows)

    # Coordinates of every nonzero pixel in the image.
    nonzero = binary_warped.nonzero()
    nonzeroy = np.array(nonzero[0])
    nonzerox = np.array(nonzero[1])

    # Per-window index arrays into nonzerox / nonzeroy.
    left_lane_inds = []
    right_lane_inds = []

    for window in range(nwindows):
        # Vertical extent of this window, counted from the bottom row.
        win_y_low = height - (window + 1) * window_height
        win_y_high = height - window * window_height
        in_rows = (win_y_low <= nonzeroy) & (nonzeroy < win_y_high)

        # Horizontal extents. They may reach beyond the image border; that is
        # harmless because they are only compared against pixel coordinates.
        win_xleft_low = leftx_current - margin
        win_xleft_high = leftx_current + margin
        win_xright_low = rightx_current - margin
        win_xright_high = rightx_current + margin

        good_left_inds = (in_rows &
                          (win_xleft_low <= nonzerox) &
                          (nonzerox < win_xleft_high)).nonzero()[0]
        good_right_inds = (in_rows &
                           (win_xright_low <= nonzerox) &
                           (nonzerox < win_xright_high)).nonzero()[0]

        left_lane_inds.append(good_left_inds)
        right_lane_inds.append(good_right_inds)

        # Re-centre the next window only when enough pixels support it.
        if len(good_left_inds) > minpix:
            leftx_current = int(np.mean(nonzerox[good_left_inds]))
        if len(good_right_inds) > minpix:
            rightx_current = int(np.mean(nonzerox[good_right_inds]))

    # Both lists hold nwindows >= 1 arrays, so concatenation needs no
    # error-swallowing fallback.
    left_lane_inds = np.concatenate(left_lane_inds)
    right_lane_inds = np.concatenate(right_lane_inds)

    # Pixel coordinates of each line.
    leftx = nonzerox[left_lane_inds]
    lefty = nonzeroy[left_lane_inds]
    rightx = nonzerox[right_lane_inds]
    righty = nonzeroy[right_lane_inds]

    return leftx, lefty, rightx, righty, out_img


def fit_polynomial(binary_warped, ym_per_pix=20.809 / 720, xm_per_pix=3.7 / 680):
    """Fit both lane lines, render the lane overlay and estimate curvature.

    A second-order polynomial ``x = a*y**2 + b*y + c`` is fitted to the
    pixels that ``find_lane_pixels`` assigns to each line. The returned image
    is black except for: the area between the two fitted curves
    ([0, 255, 0]), the left-line pixels ([0, 0, 255]), the right-line pixels
    ([255, 0, 0]) and the fitted curves themselves ([0, 255, 255]).

    Fitted x positions outside the image are clipped for the fill and skipped
    for the curve pixels. Without this, negative positions would wrap around
    to the other side of the image and positions beyond the width would raise
    an IndexError.

    Args:
        binary_warped: 2-D top-down binary image.
        ym_per_pix: metres per pixel along y, used for the curvature.
        xm_per_pix: metres per pixel along x, used for the curvature.

    Returns:
        Tuple ``(out_img, mean_curverad)``. ``mean_curverad`` is the average
        of the two radii of curvature, evaluated at the bottom row and
        weighted by the number of pixels found for each line. It is in
        metres when the two scale factors are metres per pixel.

    Note:
        ``np.polyfit`` is called directly on the detected pixels, so any
        error it raises (e.g. for a line with no pixels at all) propagates.
    """
    # Find our lane pixels first.
    leftx, lefty, rightx, righty, out_img = find_lane_pixels(binary_warped)

    # Second-order fit x = f(y) for each line, in pixel units.
    left_fit = np.polyfit(lefty, leftx, 2)
    right_fit = np.polyfit(righty, rightx, 2)

    # Evaluate both fits on every image row.
    height, width = binary_warped.shape[:2]
    rows = np.arange(height)
    ploty = rows.astype(float)
    left_fitx = left_fit[0]*ploty**2 + left_fit[1]*ploty + left_fit[2]
    right_fitx = right_fit[0]*ploty**2 + right_fit[1]*ploty + right_fit[2]

    ## Visualization ##
    # Start from a black canvas.
    out_img[:] = 0

    # Fill the free space between the curves, row by row, in one vectorised
    # step: column c of row r is filled when left[r] <= c < right[r].
    columns = np.arange(width)
    left_edge = np.clip(left_fitx, 0, width).astype(int)
    right_edge = np.clip(right_fitx, 0, width).astype(int)
    between = (columns >= left_edge[:, None]) & (columns < right_edge[:, None])
    out_img[between] = [0, 255, 0]

    # Colour the detected pixels of each line.
    out_img[lefty, leftx] = [0, 0, 255]
    out_img[righty, rightx] = [255, 0, 0]

    # Mark the fitted curves, restricted to the columns that exist.
    for fitx in (left_fitx, right_fitx):
        visible = (fitx >= 0) & (fitx < width)
        out_img[rows[visible], fitx[visible].astype(int)] = [0, 255, 255]

    ## Curvature Radius ##
    # Refit in scaled units so that the radius comes out in those units.
    left_fit_cr = np.polyfit(lefty*ym_per_pix, leftx*xm_per_pix, 2)
    right_fit_cr = np.polyfit(righty*ym_per_pix, rightx*xm_per_pix, 2)

    # Evaluate at the largest y, i.e. the bottom row of the image.
    y_eval = np.max(ploty*ym_per_pix)
    left_curverad = (1 + (2*left_fit_cr[0]*y_eval + left_fit_cr[1])**2)**1.5 / np.absolute(2*left_fit_cr[0])
    right_curverad = (1 + (2*right_fit_cr[0]*y_eval + right_fit_cr[1])**2)**1.5 / np.absolute(2*right_fit_cr[0])

    # Weight each line by the number of pixels supporting it.
    mean_curverad = (len(leftx)*left_curverad + len(rightx)*right_curverad) / (len(leftx) + len(rightx))

    return out_img, mean_curverad  # (left_curverad, right_curverad)

In [51]:
# Fit lane polynomials on every warped binary image and save the rendered
# overlay under ../output_images with 'warped_bin' replaced by 'patch_bin'.
warped_bin_images = glob.glob('../output_images/warped_bin*.jpg')

for fname in warped_bin_images:
    img = cv2.imread(fname)
    # Convert from BGR to a single gray channel before fitting.
    gray_img = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
    overlay_img, curve_rad = fit_polynomial(gray_img)

    patch_name = os.path.basename(fname).replace('warped_bin', 'patch_bin')
    cv2.imwrite(os.path.join('../output_images', patch_name), overlay_img)

cv2.destroyAllWindows()

In [9]:
# Four hand-labelled image points as [x, y] pixel coordinates; the code below
# indexes them as 0..3 when measuring lane length and width.
label_img_coords = [[573, 467], [709, 467], [1007, 667], [293, 667]]

def coordTransfrom(img_coord, cam_height=2.05, camera_matrix=None):
    """Project an image pixel onto the ground plane below the camera.

    The pixel is converted to a normalised viewing ray ``(xd, yd, 1)`` with
    the camera matrix, the axes are permuted so the ray becomes
    ``(1, -xd, -yd)``, and the ray is scaled until its third component equals
    ``-cam_height``.

    Args:
        img_coord: ``[x, y]`` pixel coordinate.
        cam_height: height of the camera above the ground. The default is a
            guessed value, chosen so the estimated lane width looks
            reasonable.
        camera_matrix: 3x3 intrinsic matrix. Defaults to the module-level
            calibration result ``mtx``.

    Returns:
        Tuple ``(x, y, 0)`` with the ground-plane position, or ``None`` (after
        printing the ray) when the ray's third component is zero, because it
        then never meets the ground plane.
    """
    if camera_matrix is None:
        camera_matrix = mtx  # calibration result defined at module level
    camera_matrix = np.asarray(camera_matrix)

    # Pixel -> normalised camera coordinates.
    xd = (img_coord[0] - camera_matrix[0, 2]) / camera_matrix[0, 0]
    yd = (img_coord[1] - camera_matrix[1, 2]) / camera_matrix[1, 1]
    cam_coord_vec = np.array([[xd], [yd], [1]])

    # Axis permutation; its transpose maps (xd, yd, 1) to (1, -xd, -yd).
    # A plain ndarray with @ replaces np.matrix, whose use NumPy discourages.
    rtx = np.array([[0, -1,  0],
                    [0,  0, -1],
                    [1,  0,  0]])
    ret_vec = rtx.T @ cam_coord_vec

    if ret_vec[2, 0] == 0:
        # The ray has no vertical component, so there is no intersection.
        print(ret_vec)
        return None

    # Scale factor that brings the ray's third component to -cam_height.
    cz = -cam_height / ret_vec[2, 0]
    return (ret_vec[0, 0] * cz, ret_vec[1, 0] * cz, 0)

# Ground-plane estimates of the four labelled points, in list order.
ground_pt0, ground_pt1, ground_pt2, ground_pt3 = [
    coordTransfrom(pt) for pt in label_img_coords
]

# Differences in the first returned coordinate along each side of the lane.
print('length')
print(ground_pt0[0] - ground_pt3[0])
print(ground_pt1[0] - ground_pt2[0])
# Differences in the second returned coordinate across the far and near edge.
print('width')
print(ground_pt0[1] - ground_pt1[1])
print(ground_pt3[1] - ground_pt2[1])

length
20.808765221287736
20.808765221287736
width
3.4327046567787898
5.188978777062997


In [18]:
def weighted_img(img, initial_img, α=0.8, β=1., γ=0.):
    """
    Blend an overlay image onto a base image with cv2.addWeighted.

    `img` is the overlay (weighted by β) and `initial_img` is the base image
    (weighted by α); γ is the constant added to the weighted sum.

    The arguments are handed to cv2.addWeighted so that the result is:

    initial_img * α + img * β + γ
    NOTE: initial_img and img must be the same shape!
    """
    blended = cv2.addWeighted(initial_img, α, img, β, γ)
    return blended

In [53]:
# Warp every lane overlay back to the camera view, blend it onto the matching
# undistorted image and preview the result.
fitted_bin_images = glob.glob('../output_images/patch_bin*.jpg')

for fname in fitted_bin_images:
    img = cv2.imread(fname)
    img_size = img.shape[1::-1]  # (width, height)

    # Same rectangle as in the forward warp: the image inset by the offsets.
    right_x = img_size[0] - offset_x
    bottom_y = img_size[1] - offset_y
    topdown_coords = [[offset_x, offset_y], [right_x, offset_y],
                      [right_x, bottom_y], [offset_x, bottom_y]]

    src_pts = np.float32(label_img_coords)
    dst_pts = np.float32(topdown_coords)
    # Swapping the point sets gives the top-down -> camera-view transform.
    pt_minv = cv2.getPerspectiveTransform(dst_pts, src_pts)

    rectified_img = cv2.warpPerspective(img, pt_minv, img_size, flags=cv2.INTER_LINEAR)

    # The undistorted image shares the file name apart from its prefix.
    cal_img = cv2.imread(fname.replace('patch_bin', 'cal_img'))
    rectified_img = weighted_img(rectified_img, cal_img)

    cv2.imshow('rectified_img', rectified_img)
    cv2.waitKey(1500)

cv2.destroyAllWindows()