In [1]:
import numpy as np
import pandas as pd
import cv2
import os
import glob
import matplotlib.pyplot as plt
import pickle

%matplotlib inline

In [2]:
def undistort_img(cal_glob='camera_cal/*.jpg', pattern_size=(9, 6),
                  img_size=(1280, 720), out_path='camera_cal/cal_pickle.p'):
    """Calibrate the camera from chessboard photos and pickle the result.

    Every image matching ``cal_glob`` is searched for a chessboard with
    ``pattern_size`` inner corners. The detected corners are passed to
    ``cv2.calibrateCamera`` and the resulting camera matrix and distortion
    coefficients are written to ``out_path`` as a dict with the keys
    ``'mtx'`` and ``'dist'`` (the format ``undistort`` reads back).

    Args:
        cal_glob: Glob pattern selecting the calibration images.
        pattern_size: (columns, rows) of inner chessboard corners.
        img_size: (width, height) passed to ``cv2.calibrateCamera``.
        out_path: Destination of the pickled calibration.

    Raises:
        ValueError: If no chessboard could be detected in any image.
    """
    cols, rows = pattern_size

    # Prepare object points (0,0,0) ... (cols-1, rows-1, 0)
    obj_pts = np.zeros((rows * cols, 3), np.float32)
    obj_pts[:, :2] = np.mgrid[0:cols, 0:rows].T.reshape(-1, 2)

    # Object points & image points collected from all usable images
    objpoints = []
    imgpoints = []

    for fname in glob.glob(cal_glob):
        img = cv2.imread(fname)
        if img is None:
            # cv2.imread signals an unreadable file by returning None.
            continue
        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

        ret, corners = cv2.findChessboardCorners(gray, pattern_size, None)
        if ret:
            objpoints.append(obj_pts)
            imgpoints.append(corners)

    if not imgpoints:
        raise ValueError(
            "No chessboard corners found in images matching {!r}".format(cal_glob))

    # Calibrate camera
    ret, mtx, dist, rvecs, tvecs = cv2.calibrateCamera(
        objpoints, imgpoints, img_size, None, None)

    # Save camera calibration for later use; the context manager makes sure
    # the file is flushed and closed.
    with open(out_path, 'wb') as cal_file:
        pickle.dump({'mtx': mtx, 'dist': dist}, cal_file)

def undistort(img, cal_dir='camera_cal/cal_pickle.p'):
    """Return an undistorted copy of ``img`` using a pickled calibration.

    ``cal_dir`` is the path of a pickle holding a dict with the camera matrix
    under ``'mtx'`` and the distortion coefficients under ``'dist'``.
    """
    # NOTE: pickle.load executes arbitrary code from the file; only point
    # cal_dir at calibration files you created yourself.
    with open(cal_dir, mode='rb') as cal_file:
        calibration = pickle.load(cal_file)

    camera_matrix, dist_coeffs = calibration['mtx'], calibration['dist']
    return cv2.undistort(img, camera_matrix, dist_coeffs, None, camera_matrix)

In [3]:
# Run the chessboard calibration so that 'camera_cal/cal_pickle.p' exists
# before undistort() tries to load it.
undistort_img()

In [4]:
def pipeline(img, s_thresh=(100, 255), sx_thresh=(15, 255)):
    """Turn a colour frame into a binary lane-candidate mask.

    The frame is undistorted and converted to HLS. A pixel is set to 1 when
    either its saturation lies inside ``s_thresh`` or the scaled absolute
    x-gradient of its lightness lies inside ``sx_thresh``.

    Args:
        img: Colour frame (converted with ``cv2.COLOR_RGB2HLS``).
        s_thresh: Inclusive (low, high) bounds for the saturation channel.
        sx_thresh: Inclusive (low, high) bounds for the scaled x-gradient.

    Returns:
        2-D ``uint8`` array with the same height/width as ``img``, holding
        1 for lane candidates and 0 elsewhere.
    """
    img = undistort(img)

    # Convert to HLS colour space and pick the lightness / saturation channels
    hls = cv2.cvtColor(img, cv2.COLOR_RGB2HLS).astype(float)
    l_channel = hls[:, :, 1]
    s_channel = hls[:, :, 2]

    # Sobel x: dx=1, dy=0 gives the derivative in x only. (dx=1, dy=1 would
    # be the mixed second derivative, which responds to corners instead of
    # the near-vertical edges of lane lines.)
    sobelx = cv2.Sobel(l_channel, cv2.CV_64F, 1, 0)
    abs_sobelx = np.absolute(sobelx)

    # Scale to 0..255; a completely flat image has no gradient to scale.
    peak = np.max(abs_sobelx)
    if peak > 0:
        scaled_sobel = np.uint8(255 * abs_sobelx / peak)
    else:
        scaled_sobel = np.zeros(abs_sobelx.shape, dtype=np.uint8)

    # Threshold x gradient and colour channel
    sx_mask = (scaled_sobel >= sx_thresh[0]) & (scaled_sobel <= sx_thresh[1])
    s_mask = (s_channel >= s_thresh[0]) & (s_channel <= s_thresh[1])

    combined_binary = np.zeros_like(scaled_sobel)
    combined_binary[s_mask | sx_mask] = 1
    return combined_binary

def perspective_warp(img,
                     dst_size=(1280, 720),
                     src=np.float32([(0.43, 0.65), (0.58, 0.65), (0.1, 1), (1, 1)]),
                     dst=np.float32([(0, 0), (1, 0), (0, 1), (1, 1)])):
    """Warp ``img`` so that the ``src`` quadrilateral fills the ``dst`` one.

    ``src`` and ``dst`` are given as fractions: ``src`` is scaled by the
    width/height of ``img`` and ``dst`` by ``dst_size`` (width, height),
    which is also the size of the returned image.
    """
    height, width = img.shape[:2]

    # Turn the fractional corner coordinates into pixel coordinates.
    src_px = src * np.float32([(width, height)])
    dst_px = dst * np.float32(dst_size)

    transform = cv2.getPerspectiveTransform(src_px, dst_px)
    return cv2.warpPerspective(img, transform, dst_size)

def inv_perspective_warp(img,
                         dst_size=(1280, 720),
                         src=np.float32([(0, 0), (1, 0), (0, 1), (1, 1)]),
                         dst=np.float32([(0.43, 0.65), (0.58, 0.65), (0.1, 1), (1, 1)])):
    """Warp ``img`` with the default corners of ``perspective_warp`` swapped.

    By default the full frame (``src``) is mapped onto the trapezoid
    (``dst``). ``src`` is scaled by the width/height of ``img`` and ``dst``
    by ``dst_size`` (width, height), which is also the output size.
    """
    height, width = img.shape[:2]

    # Turn the fractional corner coordinates into pixel coordinates.
    src_px = src * np.float32([(width, height)])
    dst_px = dst * np.float32(dst_size)

    transform = cv2.getPerspectiveTransform(src_px, dst_px)
    return cv2.warpPerspective(img, transform, dst_size)

def get_hist(img):
    """Sum each column of the bottom half of ``img`` (rows from height // 2 down)."""
    first_row = img.shape[0] // 2
    bottom_half = img[first_row:, :]
    return np.sum(bottom_half, axis=0)

In [5]:
# History of the second-order polynomial coefficients (a, b, c) fitted to the
# left and right lane lines. sliding_window() appends one entry per successful
# fit and averages the most recent 10 entries of each list.
left_a, left_b, left_c = [],[],[]
right_a, right_b, right_c = [],[],[]

def sliding_window(img, nwindows=9, margin=150, minpix=1, draw_windows=True):
    """Find both lane lines in a warped binary image with a sliding-window search.

    The column histogram of the bottom half of ``img`` gives the starting x
    position of each line. ``nwindows`` windows are then stacked from the
    bottom of the image upwards, each re-centred on the mean x of the pixels
    found in the previous one. A second-order polynomial x = a*y^2 + b*y + c
    is fitted to the collected pixels of each line, and the coefficients are
    averaged over the most recent 10 fits kept in the module-level lists
    ``left_a`` ... ``right_c``.

    Args:
        img: 2-D binary image (non-zero pixels are lane candidates).
        nwindows: Number of vertical windows.
        margin: Half-width of each window in pixels.
        minpix: A window re-centres only when it holds more than ``minpix``
            pixels; a line is rejected when it has fewer than ``minpix``
            pixels in total.
        draw_windows: Draw the window rectangles on the visualisation image.

    Returns:
        ``(out_img, (left_fitx, right_fitx), (left_fit, right_fit), ploty)``.
        When too few pixels were found for either line the result is
        ``(out_img, (None, None), (None, None), None)``.
    """
    global left_a, left_b, left_c, right_a, right_b, right_c
    history = 10  # number of most recent fits that are averaged

    out_img = np.dstack((img, img, img))*255

    histogram = get_hist(img)
    # Find peaks of left and right halves. Plain ints keep the window corners
    # acceptable to cv2.rectangle regardless of the numpy integer type.
    midpoint = int(histogram.shape[0]/2)
    leftx_current = int(np.argmax(histogram[:midpoint]))
    rightx_current = int(np.argmax(histogram[midpoint:])) + midpoint

    # Set height of windows
    window_height = int(img.shape[0]/nwindows)
    # Identify the x and y positions of all nonzero pixels in the image
    nonzero = img.nonzero()
    nonzeroy = np.array(nonzero[0])
    nonzerox = np.array(nonzero[1])

    # Lists receiving the left and right lane pixel indices
    left_lane_inds = []
    right_lane_inds = []

    # Step through the windows one by one, bottom of the image first
    for window in range(nwindows):
        # Identify window boundaries in x and y (and right and left)
        win_y_low = img.shape[0] - (window+1)*window_height
        win_y_high = img.shape[0] - window*window_height
        win_xleft_low = leftx_current - margin
        win_xleft_high = leftx_current + margin
        win_xright_low = rightx_current - margin
        win_xright_high = rightx_current + margin
        # Draw the windows on the visualization image
        if draw_windows:
            cv2.rectangle(out_img, (win_xleft_low, win_y_low), (win_xleft_high, win_y_high),
                          (100, 255, 255), 3)
            cv2.rectangle(out_img, (win_xright_low, win_y_low), (win_xright_high, win_y_high),
                          (100, 255, 255), 3)
        # Identify the nonzero pixels in x and y within the window
        in_rows = (nonzeroy >= win_y_low) & (nonzeroy < win_y_high)
        good_left_inds = (in_rows &
                          (nonzerox >= win_xleft_low) & (nonzerox < win_xleft_high)).nonzero()[0]
        good_right_inds = (in_rows &
                           (nonzerox >= win_xright_low) & (nonzerox < win_xright_high)).nonzero()[0]
        # Append these indices to the lists
        left_lane_inds.append(good_left_inds)
        right_lane_inds.append(good_right_inds)
        # If you found > minpix pixels, recenter next window on their mean position
        if len(good_left_inds) > minpix:
            leftx_current = int(np.mean(nonzerox[good_left_inds]))
        if len(good_right_inds) > minpix:
            rightx_current = int(np.mean(nonzerox[good_right_inds]))

    # Concatenate the arrays of indices
    left_lane_inds = np.concatenate(left_lane_inds)
    right_lane_inds = np.concatenate(right_lane_inds)

    # Check if there are enough pixels to fit the lanes
    if len(left_lane_inds) < minpix or len(right_lane_inds) < minpix:
        return out_img, (None, None), (None, None), None

    # Extract left and right line pixel positions
    leftx = nonzerox[left_lane_inds]
    lefty = nonzeroy[left_lane_inds]
    rightx = nonzerox[right_lane_inds]
    righty = nonzeroy[right_lane_inds]

    # Fit a second order polynomial to each
    left_fit = np.polyfit(lefty, leftx, 2)
    right_fit = np.polyfit(righty, rightx, 2)

    # Record the new coefficients. Only the last `history` entries are ever
    # read, so older ones are dropped in place; otherwise the lists would
    # grow by one entry per frame for as long as the camera loop runs.
    for coeff_lists, coeffs in (((left_a, left_b, left_c), left_fit),
                                ((right_a, right_b, right_c), right_fit)):
        for values, coeff in zip(coeff_lists, coeffs):
            values.append(coeff)
            del values[:-history]

    left_fit_ = np.array([np.mean(left_a), np.mean(left_b), np.mean(left_c)])
    right_fit_ = np.array([np.mean(right_a), np.mean(right_b), np.mean(right_c)])

    # Generate x and y values for plotting
    ploty = np.linspace(0, img.shape[0]-1, img.shape[0])
    left_fitx = left_fit_[0]*ploty**2 + left_fit_[1]*ploty + left_fit_[2]
    right_fitx = right_fit_[0]*ploty**2 + right_fit_[1]*ploty + right_fit_[2]

    # Colour the pixels assigned to each line in the visualisation image
    out_img[lefty, leftx] = [255, 0, 100]
    out_img[righty, rightx] = [0, 100, 255]

    return out_img, (left_fitx, right_fitx), (left_fit_, right_fit_), ploty

def get_curve(img, leftx, rightx):
    """Estimate lane curvature and the vehicle's lateral offset in metres.

    ``leftx`` / ``rightx`` are the x pixel positions of the two lane lines,
    one value per image row (row 0 first). They are converted to metres with
    the fixed scales below and refitted with second-order polynomials.

    Args:
        img: Frame the lanes were detected in; only its shape is used.
        leftx: Left-line x positions, length ``img.shape[0]``.
        rightx: Right-line x positions, length ``img.shape[0]``.

    Returns:
        ``(left_curverad, right_curverad, center)``: the two radii of
        curvature evaluated at the bottom row, and the image centre minus
        the lane centre at the bottom row, all in metres. A perfectly
        straight line yields an infinite radius.
    """
    ploty = np.linspace(0, img.shape[0]-1, img.shape[0])
    ym_per_pix = 30.5/720 # meters per pixel in y dimension
    xm_per_pix = 3.7/720 # meters per pixel in x dimension
    # Bottom row of the image, expressed in metres
    y_eval_m = np.max(ploty) * ym_per_pix

    # Fit new polynomials to x,y in world space
    left_fit_cr = np.polyfit(ploty*ym_per_pix, np.asarray(leftx)*xm_per_pix, 2)
    right_fit_cr = np.polyfit(ploty*ym_per_pix, np.asarray(rightx)*xm_per_pix, 2)

    def _radius(fit):
        # Radius of curvature of x = a*y^2 + b*y + c at y_eval_m
        with np.errstate(divide='ignore'):
            return ((1 + (2*fit[0]*y_eval_m + fit[1])**2)**1.5) / np.absolute(2*fit[0])

    def _x_at_bottom(fit):
        # The fit is in metres, so it has to be evaluated at a y in metres
        return fit[0]*y_eval_m**2 + fit[1]*y_eval_m + fit[2]

    left_curverad = _radius(left_fit_cr)
    right_curverad = _radius(right_fit_cr)

    # Compare image centre and lane centre in the same unit (metres)
    car_pos_m = (img.shape[1]/2) * xm_per_pix
    lane_center_m = (_x_at_bottom(left_fit_cr) + _x_at_bottom(right_fit_cr)) / 2
    center = car_pos_m - lane_center_m

    return (left_curverad, right_curverad, center)

def draw_lanes(img, left_fit, right_fit):
    """Overlay the area between the two lane lines on ``img``.

    ``left_fit`` / ``right_fit`` hold one x position per image row. The
    polygon they enclose is filled on a blank canvas, passed through
    ``inv_perspective_warp`` and blended onto ``img``. ``img`` itself is
    returned when either line is ``None``.
    """
    if left_fit is None or right_fit is None:
        return img

    rows = np.linspace(0, img.shape[0]-1, img.shape[0])

    # Walk down the left line and back up the right one to close the polygon.
    left_edge = np.column_stack((left_fit, rows))
    right_edge = np.column_stack((right_fit, rows))[::-1]
    outline = np.concatenate((left_edge, right_edge))[np.newaxis]

    canvas = np.zeros_like(img)
    cv2.fillPoly(canvas, np.int_(outline), (255, 200, 0))

    unwarped = inv_perspective_warp(canvas)
    return cv2.addWeighted(img, 1, unwarped, 0.7, 0)

In [6]:
def vid_pipeline(img):
    """Run the full lane-detection chain on one frame.

    The frame is thresholded, warped and searched for lane lines. When both
    lines are found, the lane area and two text lines (mean curvature and
    vehicle offset) are drawn and the annotated frame is returned; otherwise
    ``img`` is returned as received.
    """
    binary = pipeline(img)
    warped = perspective_warp(binary)
    _, curves, _, _ = sliding_window(warped, draw_windows=False)

    left_curve, right_curve = curves[0], curves[1]
    if left_curve is None or right_curve is None:
        return img

    curverad = get_curve(img, left_curve, right_curve)
    lane_curve = np.mean([curverad[0], curverad[1]])
    annotated = draw_lanes(img, left_curve, right_curve)

    # Text overlay settings shared by both lines
    font = cv2.FONT_HERSHEY_SIMPLEX
    text_color = (0, 0, 0)
    text_scale = 0.5
    cv2.putText(annotated, 'Lane Curvature: {:.0f} m'.format(lane_curve),
                (570, 620), font, text_scale, text_color, 2)
    cv2.putText(annotated, 'Vehicle offset: {:.4f} m'.format(curverad[2]),
                (570, 650), font, text_scale, text_color, 2)

    return annotated

Run the cell below to use the camera:

In [7]:
import cv2
import depthai as dai
import numpy as np

def get_frame(queue):
    """Take the next message from ``queue`` and return it as an OpenCV frame."""
    return queue.get().getCvFrame()

def get_mono_camera(pipeline, is_left):
    """Create a 720p mono camera node bound to the left or right socket.

    Args:
        pipeline: DepthAI pipeline the node is created in.
        is_left: ``True`` selects the left mono camera, ``False`` the right.

    Returns:
        The configured mono camera node.
    """
    # Configure mono camera
    mono = pipeline.createMonoCamera()

    # Set Camera Resolution
    mono.setResolution(dai.MonoCameraProperties.SensorResolution.THE_720_P)

    # Bind the node to a distinct socket per side; using AUTO for both would
    # leave the two nodes indistinguishable. DepthAI documents CAM_B / CAM_C
    # as the left / right mono sockets; releases that predate those names
    # expose them as LEFT / RIGHT.
    sockets = dai.CameraBoardSocket
    if is_left:
        socket = sockets.CAM_B if hasattr(sockets, 'CAM_B') else sockets.LEFT
    else:
        socket = sockets.CAM_C if hasattr(sockets, 'CAM_C') else sockets.RIGHT
    mono.setBoardSocket(socket)
    return mono

def get_color_camera(pipeline):
    """Create a colour camera node that delivers 1280x720 video.

    The node is created in ``pipeline``, set to the 720p sensor resolution
    with a 1280x720 video size, and left on the AUTO board socket.
    """
    cam = pipeline.createColorCamera()

    # Sensor resolution and the size of the frames on the `video` output
    cam.setResolution(dai.ColorCameraProperties.SensorResolution.THE_720_P)
    cam.setVideoSize(1280, 720)

    # Socket selection is left to DepthAI
    cam.setBoardSocket(dai.CameraBoardSocket.AUTO)

    return cam

if __name__ == '__main__':
    # Interactive camera viewer.
    #   q - quit
    #   t - cycle through the four views (raw, lane overlay, left|right side
    #       by side, left/right blended)
    #   c - save the currently displayed image as capture/<n>.jpg

    # Define a pipeline
    dai_pipeline = dai.Pipeline()

    # Set up left and right cameras
    mono_left = get_mono_camera(dai_pipeline, is_left=True)
    mono_right = get_mono_camera(dai_pipeline, is_left=False)

    # Set up main camera
    color_main = get_color_camera(dai_pipeline)

    # Set output Xlink for left camera
    xout_left = dai_pipeline.createXLinkOut()
    xout_left.setStreamName("left")

    # Set output Xlink for right camera
    xout_right = dai_pipeline.createXLinkOut()
    xout_right.setStreamName("right")

    # Set output Xlink for main camera
    xout_main = dai_pipeline.createXLinkOut()
    xout_main.setStreamName("video")

    # Attach cameras to output Xlink
    mono_left.out.link(xout_left.input)
    mono_right.out.link(xout_right.input)
    color_main.video.link(xout_main.input)

    capture_dir = "capture"

    with dai.Device(dai_pipeline) as device:
        # Get output queues.
        left_queue = device.getOutputQueue(name="left", maxSize=1)
        right_queue = device.getOutputQueue(name="right", maxSize=1)
        video_queue = device.getOutputQueue(name="video", maxSize=1)

        # Set display window name
        cv2.namedWindow("Stereo Pair")

        # Variable used to toggle between the four views
        view_counter = 0

        # Initiate capture counter: continue after the highest numbered
        # capture. The folder is created when missing, and .jpg files whose
        # name does not start with a number are ignored instead of crashing.
        os.makedirs(capture_dir, exist_ok=True)
        capture_stems = [file.split('.')[0] for file in os.listdir(capture_dir)
                         if file.endswith('.jpg')]
        existing_images = [int(stem) for stem in capture_stems if stem.isdecimal()]
        capture_counter = max(existing_images, default=0) + 1

        try:
            while True:

                # Get raw frame
                raw_frame = get_frame(video_queue)

                # Get overlayed frame
                overlayed_frame = vid_pipeline(raw_frame)

                # Get left frame
                left_frame = get_frame(left_queue)

                # Get right frame
                right_frame = get_frame(right_queue)

                # Choose the view based on the current counter value
                if view_counter == 0:
                    im_out = raw_frame
                elif view_counter == 1:
                    im_out = overlayed_frame
                elif view_counter == 2:
                    im_out = np.hstack((left_frame, right_frame))
                else:
                    im_out = np.uint8(left_frame/2 + right_frame/2)

                # Display output image
                cv2.imshow("Stereo Pair", im_out)

                # Check for keyboard input
                key = cv2.waitKey(1)
                if key == ord('q'):
                    # Quit when q is pressed
                    break
                elif key == ord('t'):
                    # Toggle view when t is pressed
                    view_counter = (view_counter + 1) % 4
                elif key == ord('c'):
                    # Capture and save images when 'c' is pressed
                    frame_name = os.path.join(capture_dir, f"{capture_counter}.jpg")
                    cv2.imwrite(frame_name, im_out)
                    print(f"Image {capture_counter} captured and saved.")
                    capture_counter += 1
        finally:
            # Release the OpenCV window even when the loop ends with an error
            cv2.destroyAllWindows()

Run the cell below to generate a video with the lane overlay:

In [10]:
from IPython.display import display, HTML
from moviepy.editor import VideoFileClip

def overlay_video(input_video):
    """
    Generate video with overlayed lanes and save in 'output' folder

    Every frame of ``input_video`` is passed through ``vid_pipeline`` and the
    result is written, without audio, to ``output/<n>.mp4``. ``n`` starts at
    the number of files already in the folder plus one and is increased until
    the name is unused, so an existing video is never overwritten. The
    finished video is then shown inline in the notebook.
    """
    output_folder = 'output'

    # Create 'output' folder if it doesn't exist
    os.makedirs(output_folder, exist_ok=True)

    # Number the new file after the existing ones, skipping taken names
    existing_files = [f for f in os.listdir(output_folder)
                      if os.path.isfile(os.path.join(output_folder, f))]
    video_index = len(existing_files) + 1
    output_path = os.path.join(output_folder, f"{video_index}.mp4")
    while os.path.exists(output_path):
        video_index += 1
        output_path = os.path.join(output_folder, f"{video_index}.mp4")

    myclip = VideoFileClip(input_video)
    try:
        clip = myclip.fl_image(vid_pipeline)
        clip.write_videofile(output_path, audio=False)
    finally:
        # Close the source clip so its reader resources are released
        myclip.close()

    display(HTML(f'<video controls src="{output_path}" width="640" height="480"></video>'))

In [11]:
# Process the sample clip; the annotated video is written to the 'output' folder.
overlay_video('challenge_video.mp4')

Moviepy - Building video output\2.mp4.
Moviepy - Writing video output\2.mp4



                                                                                                                       

Moviepy - Done !
Moviepy - video ready output\2.mp4
