In [1]:
import glob
import os

import cv2
import matplotlib.image as mpimg
import matplotlib.pyplot as plt
import numpy as np
from IPython.display import HTML
from moviepy.editor import VideoFileClip

In [2]:
def calib_distort(calib_images, pattern_size=(9, 6)):
    """Estimate the camera matrix and distortion coefficients from chessboard photos.

    Parameters
    ----------
    calib_images : iterable of str
        Paths of the chessboard calibration images.
    pattern_size : tuple of int, optional
        Number of inner corners per chessboard row and column, as passed to
        ``cv2.findChessboardCorners``. Defaults to ``(9, 6)``.

    Returns
    -------
    mtx, dist
        Camera matrix and distortion coefficients from ``cv2.calibrateCamera``.

    Raises
    ------
    ValueError
        If the chessboard pattern is not detected in any of the images
        (including the case of an empty ``calib_images``).
    """
    cols, rows = pattern_size

    # Reference grid of corner coordinates (x, y, 0) shared by every image.
    objp = np.zeros((rows * cols, 3), np.float32)
    objp[:, :2] = np.mgrid[0:cols, 0:rows].T.reshape(-1, 2)

    objpoints = []
    imgpoints = []
    image_size = None

    for fname in calib_images:
        img = mpimg.imread(fname)

        # mpimg.imread delivers channels in RGB order, so convert with the
        # RGB flag rather than the BGR one.
        gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
        # (width, height) of the most recently read image.
        image_size = gray.shape[::-1]

        found, corners = cv2.findChessboardCorners(gray, pattern_size, None)
        if found:
            imgpoints.append(corners)
            objpoints.append(objp)

    if not objpoints:
        raise ValueError(
            'No chessboard corners of size {} were found in the calibration images'.format(pattern_size)
        )

    _, mtx, dist, _, _ = cv2.calibrateCamera(objpoints, imgpoints, image_size, None, None)

    return mtx, dist

In [3]:
def abs_sobel_thresh(img, orient='x', sobel_kernel=3, thresh=(0, 255)):
    """Threshold the absolute Sobel derivative of an RGB image along one axis.

    Parameters
    ----------
    img : ndarray
        Image passed to ``cv2.cvtColor`` with ``COLOR_RGB2GRAY``.
    orient : str
        ``'x'`` takes the derivative in x; any other value takes it in y.
    sobel_kernel : int
        Sobel kernel size (``ksize``).
    thresh : tuple
        Inclusive ``(min, max)`` bounds applied to the 0-255 scaled derivative.

    Returns
    -------
    ndarray of uint8
        Mask holding 1 where the scaled derivative lies within ``thresh``, else 0.
    """
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)

    # Derivative order per axis: (1, 0) for x, (0, 1) for y.
    dx, dy = (1, 0) if orient == 'x' else (0, 1)
    abs_sobel = np.absolute(cv2.Sobel(gray, cv2.CV_64F, dx, dy, ksize=sobel_kernel))

    # Scale to 8-bit. A completely flat image has a zero peak; dividing by it
    # would produce NaN, so treat that case as "no gradient anywhere".
    peak = np.max(abs_sobel)
    if peak > 0:
        scaled_sobel = np.uint8(255 * abs_sobel / peak)
    else:
        scaled_sobel = np.zeros(abs_sobel.shape, dtype=np.uint8)

    grad_binary = np.zeros_like(scaled_sobel)
    grad_binary[(scaled_sobel >= thresh[0]) & (scaled_sobel <= thresh[1])] = 1

    return grad_binary

In [4]:
def mag_thresh(image, sobel_kernel=3, mag_thresh=(20, 100)):
    """Threshold the Sobel gradient magnitude of an RGB image.

    Parameters
    ----------
    image : ndarray
        Image passed to ``cv2.cvtColor`` with ``COLOR_RGB2GRAY``.
    sobel_kernel : int
        Sobel kernel size (``ksize``).
    mag_thresh : tuple
        Inclusive ``(min, max)`` bounds applied to the 0-255 scaled magnitude.
        (Inside this function the name refers to the argument, not the function.)

    Returns
    -------
    ndarray of uint8
        Mask holding 1 where the scaled magnitude lies within ``mag_thresh``, else 0.
    """
    gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)

    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=sobel_kernel)
    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=sobel_kernel)

    mag_sobel = np.sqrt(np.square(sobelx) + np.square(sobely))

    # Scale to 8-bit. A completely flat image has a zero peak; dividing by it
    # would produce NaN, so treat that case as "no gradient anywhere".
    peak = np.max(mag_sobel)
    if peak > 0:
        scaled_sobel = np.uint8(255 * mag_sobel / peak)
    else:
        scaled_sobel = np.zeros(mag_sobel.shape, dtype=np.uint8)

    mag_binary = np.zeros_like(scaled_sobel)
    mag_binary[(scaled_sobel >= mag_thresh[0]) & (scaled_sobel <= mag_thresh[1])] = 1

    return mag_binary

In [5]:
def dir_threshold(image, sobel_kernel=3, thresh=(0, np.pi/2)):
    """Threshold the direction of the Sobel gradient of an RGB image.

    The direction is ``arctan2(|dI/dy|, |dI/dx|)``, computed on the grayscale
    version of ``image``. Returns an array with the same dtype as that
    direction array, holding 1 where the direction lies within the inclusive
    bounds ``thresh`` and 0 elsewhere.
    """
    gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)

    # Absolute derivatives along each axis.
    grad_x = np.absolute(cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=sobel_kernel))
    grad_y = np.absolute(cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=sobel_kernel))

    angle = np.arctan2(grad_y, grad_x)

    # Boolean selection turned into a 0/1 array of the angle's own dtype.
    within = (angle >= thresh[0]) & (angle <= thresh[1])
    return within.astype(angle.dtype)

In [6]:
def hls_thresh(image, ctype='S', thresh=(0, 255)):
    """Threshold one channel of the HLS representation of an RGB image.

    ``ctype == 'S'`` selects the third HLS plane (index 2); any other value
    selects the second plane (index 1). The returned mask is 1 where the
    chosen channel is strictly above ``thresh[0]`` and at most ``thresh[1]``.
    """
    hls = cv2.cvtColor(image, cv2.COLOR_RGB2HLS)

    # Pick the plane to threshold.
    plane_index = 2 if ctype == 'S' else 1
    channel = hls[:, :, plane_index]

    binary_output = np.zeros_like(channel)
    selected = (channel > thresh[0]) & (channel <= thresh[1])
    binary_output[selected] = 1
    return binary_output

In [7]:
def wrap(image):
    """Apply a fixed perspective transform to ``image``.

    The transform maps a hard-coded source quadrilateral onto a hard-coded
    destination rectangle. Returns the warped image (same width and height as
    the input) together with the inverse transform matrix.
    """
    # Corner order: top-left, bottom-left, bottom-right, top-right.
    src = np.float32([[580, 460], [205, 720], [1110, 720], [703, 460]])
    dst = np.float32([[320, 0], [320, 720], [960, 720], [960, 0]])

    forward = cv2.getPerspectiveTransform(src, dst)
    Minv = cv2.getPerspectiveTransform(dst, src)

    # OpenCV expects the output size as (width, height).
    width = image.shape[1]
    height = image.shape[0]
    warped = cv2.warpPerspective(image, forward, (width, height), flags=cv2.INTER_LINEAR)

    return warped, Minv

In [8]:
def find_lane_pixels(binary_warped, nwindows=9, margin=100, minpix=50):
    """Collect left/right lane pixels from a binary image with sliding windows.

    Parameters
    ----------
    binary_warped : ndarray
        2-D binary image; non-zero entries are candidate lane pixels.
    nwindows : int, optional
        Number of vertically stacked search windows.
    margin : int, optional
        Half-width of each window (window spans centre +/- margin).
    minpix : int, optional
        A window must contain more than this many pixels to recentre the
        next window on their mean x position.

    Returns
    -------
    leftx, lefty, rightx, righty : ndarray
        x / y coordinates of the pixels assigned to the left and right lines.
    out_img : ndarray
        Three-channel copy of ``binary_warped`` with the search windows drawn.
    """
    height = binary_warped.shape[0]

    # Column sums over the bottom half; the strongest column on each side of
    # the midpoint seeds the search for that lane line.
    histogram = np.sum(binary_warped[height // 2:, :], axis=0)
    out_img = np.dstack((binary_warped, binary_warped, binary_warped))

    # Plain Python ints throughout: np.int no longer exists in current NumPy,
    # and the values are later handed to cv2.rectangle as point coordinates.
    midpoint = int(histogram.shape[0] // 2)
    leftx_current = int(np.argmax(histogram[:midpoint]))
    rightx_current = int(np.argmax(histogram[midpoint:])) + midpoint

    window_height = int(height // nwindows)

    # Coordinates of every non-zero pixel in the image.
    nonzero = binary_warped.nonzero()
    nonzeroy = np.array(nonzero[0])
    nonzerox = np.array(nonzero[1])

    left_lane_inds = []
    right_lane_inds = []

    # Walk the windows from the bottom of the image upwards.
    for window in range(nwindows):
        win_y_low = height - (window + 1) * window_height
        win_y_high = height - window * window_height
        win_xleft_low = leftx_current - margin
        win_xleft_high = leftx_current + margin
        win_xright_low = rightx_current - margin
        win_xright_high = rightx_current + margin

        # Draw the windows on the visualization image.
        cv2.rectangle(out_img, (win_xleft_low, win_y_low), (win_xleft_high, win_y_high), (0, 255, 0), 2)
        cv2.rectangle(out_img, (win_xright_low, win_y_low), (win_xright_high, win_y_high), (0, 255, 0), 2)

        # Indices (into nonzerox / nonzeroy) of the pixels inside each window.
        in_rows = (nonzeroy >= win_y_low) & (nonzeroy < win_y_high)
        good_left_inds = (in_rows &
                          (nonzerox >= win_xleft_low) & (nonzerox < win_xleft_high)).nonzero()[0]
        good_right_inds = (in_rows &
                           (nonzerox >= win_xright_low) & (nonzerox < win_xright_high)).nonzero()[0]

        left_lane_inds.append(good_left_inds)
        right_lane_inds.append(good_right_inds)

        # Recentre the next window when enough pixels were found.
        if len(good_left_inds) > minpix:
            leftx_current = int(np.mean(nonzerox[good_left_inds]))
        if len(good_right_inds) > minpix:
            rightx_current = int(np.mean(nonzerox[good_right_inds]))

    # Flatten the per-window index arrays into one array per line. Errors are
    # allowed to propagate instead of being silently ignored.
    left_lane_inds = np.concatenate(left_lane_inds)
    right_lane_inds = np.concatenate(right_lane_inds)

    leftx = nonzerox[left_lane_inds]
    lefty = nonzeroy[left_lane_inds]
    rightx = nonzerox[right_lane_inds]
    righty = nonzeroy[right_lane_inds]

    return leftx, lefty, rightx, righty, out_img


def _curvature_radius_m(fit, y_eval, ym_per_pix, xm_per_pix):
    """Radius of curvature, in metres, of a pixel-space fit x = A*y**2 + B*y + C at row ``y_eval``."""
    # Rescale the pixel-space coefficients to metres (x_m = xm * x_px and
    # y_m = ym * y_px), so that every term of the formula uses the same units.
    a_m = fit[0] * xm_per_pix / ym_per_pix ** 2
    b_m = fit[1] * xm_per_pix / ym_per_pix
    slope = 2 * a_m * (y_eval * ym_per_pix) + b_m
    # A perfectly straight line (A == 0) yields an infinite radius.
    with np.errstate(divide='ignore'):
        return (1 + slope ** 2) ** 1.5 / np.absolute(2 * a_m)


def fit_polynomial(binary_warped):
    """Fit second-order polynomials to both lane lines and derive lane metrics.

    Parameters
    ----------
    binary_warped : ndarray
        2-D binary image handed to ``find_lane_pixels``.

    Returns
    -------
    out_img : ndarray
        Visualization image from ``find_lane_pixels`` with the left-line
        pixels set to [255, 0, 0] and the right-line pixels to [0, 0, 255].
    left_curverad, right_curverad : float
        Radius of curvature of each line in metres, evaluated at the bottom row.
    vehicle_position : float
        (midpoint between the two fitted lines at the bottom row) minus
        (image centre column), converted to metres. Positive when the lane
        midpoint lies to the right of the image centre column.
    polypoints : dict
        ``'ploty'``, ``'left_fitx'`` and ``'right_fitx'`` arrays sampling the
        fitted curves at every image row.

    Raises
    ------
    ValueError
        If no pixels were found for the left or the right line.
    """
    leftx, lefty, rightx, righty, out_img = find_lane_pixels(binary_warped)

    if len(leftx) == 0 or len(rightx) == 0:
        raise ValueError('No lane pixels found for the left and/or right line; cannot fit a polynomial')

    # x as a function of y, because lane lines are close to vertical.
    left_fit = np.polyfit(lefty, leftx, 2)
    right_fit = np.polyfit(righty, rightx, 2)

    # Sample both curves at every row for plotting.
    ploty = np.linspace(0, binary_warped.shape[0] - 1, binary_warped.shape[0])
    left_fitx = left_fit[0] * ploty ** 2 + left_fit[1] * ploty + left_fit[2]
    right_fitx = right_fit[0] * ploty ** 2 + right_fit[1] * ploty + right_fit[2]

    polypoints = {'ploty': ploty, 'left_fitx': left_fitx, 'right_fitx': right_fitx}

    # Conversions from pixel space to metres.
    ym_per_pix = 30 / 720  # meters per pixel in y dimension
    xm_per_pix = 3.7 / 700  # meters per pixel in x dimension

    # Evaluate at the maximum y-value, i.e. the bottom of the image.
    y_eval = np.max(ploty)

    left_curverad = _curvature_radius_m(left_fit, y_eval, ym_per_pix, xm_per_pix)
    right_curverad = _curvature_radius_m(right_fit, y_eval, ym_per_pix, xm_per_pix)

    # Offset of the lane midpoint from the image centre column, in metres.
    mid = binary_warped.shape[1] / 2
    xl = left_fit[0] * (y_eval ** 2) + left_fit[1] * y_eval + left_fit[2]
    xr = right_fit[0] * (y_eval ** 2) + right_fit[1] * y_eval + right_fit[2]
    pix_pos = xl + (xr - xl) / 2
    vehicle_position = (pix_pos - mid) * xm_per_pix

    # Colour the pixels that were assigned to each line.
    out_img[lefty, leftx] = [255, 0, 0]
    out_img[righty, rightx] = [0, 0, 255]

    return out_img, left_curverad, right_curverad, vehicle_position, polypoints

In [9]:
def output_visual(polypoints, warped_bin, undist_img, Minv):
    """Overlay the fitted lane area on the undistorted frame.

    The region between the two fitted curves is filled and both curves are
    outlined on a blank image shaped like ``warped_bin``; that drawing is
    warped with ``Minv`` to the size of ``undist_img`` and blended onto it.
    Returns the blended image.
    """
    ys = polypoints['ploty']
    left_xs = polypoints['left_fitx']
    right_xs = polypoints['right_fitx']

    # Blank three-channel canvas matching the warped binary image.
    blank = np.zeros_like(warped_bin).astype(np.uint8)
    overlay = np.dstack([blank, blank, blank])

    # (x, y) vertices: left curve top-to-bottom, right curve reversed, so the
    # concatenation traces a closed outline around the lane.
    left_edge = np.array([np.vstack([left_xs, ys]).T])
    right_edge = np.array([np.vstack([right_xs, ys]).T[::-1]])
    outline = np.hstack((left_edge, right_edge))

    cv2.fillPoly(overlay, np.int_([outline]), (0,255, 0))
    cv2.polylines(overlay, np.int32([left_edge]), isClosed=False, color=(255,0,0), thickness=15)
    cv2.polylines(overlay, np.int32([right_edge]), isClosed=False, color=(0,0,255), thickness=15)

    # Warp the drawing with Minv to the frame's (width, height).
    frame_size = (undist_img.shape[1], undist_img.shape[0])
    unwarped = cv2.warpPerspective(overlay, Minv, frame_size)

    return cv2.addWeighted(undist_img, 1, unwarped, 0.3, 0)

In [14]:
import timeit

# glob returns paths in arbitrary order; sorting makes test_images[0] and the
# processing order reproducible across runs and machines.
calib_images = sorted(glob.glob('camera_cal/calibration*.jpg'))
test_images = sorted(glob.glob('test_images/*.jpg'))
test_img = mpimg.imread(test_images[0])
# mtx / dist are module-level values read by pipeline() below.
mtx, dist = calib_distort(calib_images)


def pipeline(test_img):
    """Run the full lane-finding pipeline on one RGB frame.

    Steps: undistort with the module-level ``mtx`` / ``dist``, build a combined
    gradient + S-channel binary image, warp it, fit the lane lines, draw the
    lane back onto the undistorted frame and annotate it with the curvature
    and the vehicle offset.

    Parameters
    ----------
    test_img : ndarray
        Colour frame; the thresholding helpers convert it with RGB flags.

    Returns
    -------
    ndarray
        Annotated frame.
    """
    ### Distortion correction to raw images
    undist_img = cv2.undistort(test_img, mtx, dist, None, mtx)

    ### Color transforms, gradients, etc., to create a thresholded binary image.
    ksize = 3

    gradx = abs_sobel_thresh(undist_img, orient='x', sobel_kernel=ksize, thresh=(9, 100))
    mag_binary = mag_thresh(undist_img, sobel_kernel=ksize, mag_thresh=(30, 100))
    dir_binary = dir_threshold(undist_img, sobel_kernel=ksize, thresh=(0.7, 1.3))
    S_binary = hls_thresh(undist_img, ctype='S', thresh=(130, 200))

    # A pixel is kept when all three gradient tests agree, or when the
    # S-channel test alone fires.
    combined_binary = np.zeros_like(gradx)
    combined_binary[((gradx == 1) & (mag_binary == 1) & (dir_binary == 1)) | (S_binary == 1)] = 1

    ### Perspective transform to rectify binary image
    warped_bin, Minv = wrap(combined_binary)

    ### Detect lanes, curvature and vehicle position
    _, left_curverad, right_curverad, vehicle_position, polypoints = fit_polynomial(warped_bin)

    ### Unwarp and visualize
    results = output_visual(polypoints, warped_bin, undist_img, Minv)

    font = cv2.FONT_HERSHEY_SIMPLEX

    # int() cannot convert inf/nan, which a perfectly straight fit produces.
    if np.isfinite(right_curverad):
        radius_text = 'Radius of Curvature = {}m'.format(int(right_curverad))
    else:
        radius_text = 'Radius of Curvature = straight'

    # fit_polynomial reports (lane midpoint - image centre). A positive value
    # means the lane midpoint is to the right of the image centre, i.e. the
    # vehicle sits to the LEFT of the lane centre. Show the magnitude together
    # with the direction word, and handle a zero offset explicitly (the old
    # sign-keyed lookup had no entry for 0).
    offset = float(vehicle_position)
    distance = round(abs(offset), 2)
    if distance == 0:
        position_text = 'The vehicule is at the center'
    else:
        side = 'left' if offset > 0 else 'right'
        position_text = 'The vehicule is {}m to the {} of the center'.format(distance, side)

    cv2.putText(results, radius_text, (50, 100), font, 1, (255, 255, 0), 2, cv2.LINE_AA)
    cv2.putText(results, position_text, (50, 150), font, 1, (255, 255, 0), 2, cv2.LINE_AA)

    return results

In [36]:
# cv2.imwrite does not create missing directories, so make sure it exists.
os.makedirs('output_images', exist_ok=True)

for image in test_images:
    bgr_img = cv2.imread(image)
    if bgr_img is None:
        raise IOError('Could not read image: {}'.format(image))
    # cv2.imread yields BGR, while pipeline() converts with RGB flags and
    # draws its overlay with RGB colour tuples.
    test_img = cv2.cvtColor(bgr_img, cv2.COLOR_BGR2RGB)
    result = pipeline(test_img)
    # cv2.imwrite expects BGR again; keep only the file name for the output path.
    out_path = os.path.join('output_images', os.path.basename(image))
    cv2.imwrite(out_path, cv2.cvtColor(result, cv2.COLOR_RGB2BGR))

In [37]:
# Run the lane-finding pipeline over the project video and write the result
# to `white_output` (the display cell further down reads the same variable).
white_output = 'output_video.mp4'
clip1 = VideoFileClip('project_video.mp4')
# `pipeline` is handed to fl_image as the per-frame image transform.
white_clip = clip1.fl_image(pipeline) #NOTE: this function expects color images!!
# %time reports the CPU and wall-clock time of the write; no audio track is written.
%time white_clip.write_videofile(white_output, audio=False)

[MoviePy] >>>> Building video output_video.mp4
[MoviePy] Writing video output_video.mp4



  0%|          | 0/1261 [00:00<?, ?it/s][A
  0%|          | 1/1261 [00:00<05:20,  3.93it/s][A
  0%|          | 2/1261 [00:00<05:31,  3.80it/s][A
  0%|          | 3/1261 [00:00<05:26,  3.85it/s][A
  0%|          | 4/1261 [00:01<05:16,  3.98it/s][A
  0%|          | 5/1261 [00:01<05:10,  4.05it/s][A
  0%|          | 6/1261 [00:01<05:01,  4.17it/s][A
  1%|          | 7/1261 [00:01<05:00,  4.17it/s][A
  1%|          | 8/1261 [00:01<04:51,  4.30it/s][A
  1%|          | 9/1261 [00:02<04:49,  4.32it/s][A
  1%|          | 10/1261 [00:02<04:44,  4.39it/s][A
  1%|          | 11/1261 [00:02<04:52,  4.27it/s][A
  1%|          | 12/1261 [00:02<04:48,  4.33it/s][A
  1%|          | 13/1261 [00:03<04:50,  4.30it/s][A
  1%|          | 14/1261 [00:03<04:46,  4.35it/s][A
  1%|          | 15/1261 [00:03<04:50,  4.29it/s][A
  1%|▏         | 16/1261 [00:03<04:46,  4.34it/s][A
  1%|▏         | 17/1261 [00:04<04:48,  4.31it/s][A
  1%|▏         | 18/1261 [00:04<04:45,  4.36it/s][A
  2%|▏    

[MoviePy] Done.
[MoviePy] >>>> Video ready: output_video.mp4 

CPU times: user 3min 35s, sys: 1min 1s, total: 4min 37s
Wall time: 6min 48s


In [38]:
# Embed the video file named by `white_output` as the cell's rich output.
HTML("""
<video width="960" height="540" controls>
  <source src="{0}">
</video>
""".format(white_output))