Imports, Parameters, and Object Points

In [2]:
import cv2
import numpy as np
import glob

# Chessboard geometry: number of inner corners as (columns, rows) and the
# physical edge length of a single square.
pattern_size = (9, 6)
square_size = 21.7  # length of each square in mm

# Object points: the 3D position (in mm, on the Z = 0 plane) of every inner
# corner in the chessboard coordinate system. The x index varies fastest, so
# the points run (0,0), (1,0), ..., (8,0), (0,1), ... before scaling.
objp = np.zeros((pattern_size[0] * pattern_size[1], 3), np.float32)
objp[:, :2] = np.mgrid[0:pattern_size[0], 0:pattern_size[1]].T.reshape(-1, 2)
objp *= square_size

# Correspondences collected from every usable image (automatic + manual)
object_points_all = []   # 3D points in real-world space
image_points_all = []    # 2D points in the image plane

# Correspondences from images whose corners were detected automatically
object_points_auto = []
image_points_auto = []

# glob returns paths in arbitrary, platform-dependent order. Sort them so that
# index-based selections made later (e.g. "the first 10 automatic images")
# pick the same images on every run.
training_files = sorted(glob.glob('training_images/*.jpg'))

Helper functions for corner detection

In [4]:
# CHOICE 5: Enhance input for automatic detection
def preprocess_image(img):
    """Return a contrast-equalised, median-blurred grayscale version of *img*.

    Args:
        img: Either a BGR colour image (H x W x 3) or an image that is already
            single-channel (H x W or H x W x 1).

    Returns:
        The grayscale image after histogram equalisation and a 5x5 median blur.
    """
    # cv2.cvtColor(..., COLOR_BGR2GRAY) raises on single-channel input, and some
    # callers hand in an image that has already been converted, so only convert
    # when there really are colour channels.
    if img.ndim == 2:
        gray = img
    elif img.shape[2] == 1:
        gray = img[:, :, 0]
    else:
        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

    gray_eq = cv2.equalizeHist(gray)
    gray_blur = cv2.medianBlur(gray_eq, 5)
    return gray_blur

# Function that allows automatic inner corner detection using OpenCV's chessboard detection functions
def detect_corners_automatically(img, pattern_size):
    """Detect the inner chessboard corners of *img* without user interaction.

    The image is first run through ``preprocess_image``. The sector-based
    detector ``cv2.findChessboardCornersSB`` is tried first; if it is missing
    from the installed OpenCV build or raises an OpenCV error, the classic
    ``cv2.findChessboardCorners`` is used instead.

    Args:
        img: Image to search.
        pattern_size: Number of inner corners as (columns, rows).

    Returns:
        A ``(ret, corners)`` pair exactly as returned by the OpenCV detector:
        a success flag and the detected corner coordinates.
    """
    preprocessed = preprocess_image(img)
    try:
        ret, corners = cv2.findChessboardCornersSB(preprocessed, pattern_size, None)
    except (AttributeError, cv2.error):
        # Fall back to findChessboardCorners with flags if findChessboardCornersSB is unavailable.
        # The third positional parameter of findChessboardCorners is the
        # optional output array `corners`, so the flags must go by keyword.
        flags = cv2.CALIB_CB_ADAPTIVE_THRESH + cv2.CALIB_CB_NORMALIZE_IMAGE
        ret, corners = cv2.findChessboardCorners(preprocessed, pattern_size, flags=flags)
    return ret, corners

# Function that provides an interactive manual annotation interface
# Choice 3: Improves the localization of the four corner points by providing zoomed-in feedback, undo, and confirmation
def get_manual_corners(img):
    """Let the user click the four outer chessboard corners in an OpenCV window.

    Every left click in the "Manual Annotation" window opens a magnified
    "Zoomed Refinement" window around the click; a click in that window sets
    the final position, while Esc keeps the coarse click. In the main window
    'u' removes the most recent point, 'a' accepts once four points exist and
    Esc ends the session.

    Args:
        img: Image to annotate. It is only copied and cropped, never drawn on.

    Returns:
        A list of four (x, y) points in click order (the prompt asks for
        top-left, top-right, bottom-right, bottom-left), or None when the
        session ends without exactly four points.
    """
    required_points = 4
    clicked_points = []
    img_copy = img.copy()
    original_img = img.copy()  # pristine copy used to redraw the image after undo

    # Function to update the display of the manual annotation window
    def update_display():
        nonlocal img_copy
        img_copy = original_img.copy()
        for pt in clicked_points:
            cv2.circle(img_copy, (int(pt[0]), int(pt[1])), 5, (0, 0, 255), -1)
            font = cv2.FONT_HERSHEY_SIMPLEX
            cv2.putText(img_copy, f"{int(pt[0])},{int(pt[1])}", (int(pt[0]), int(pt[1])),
                        font, 0.5, (0, 0, 255), 1)
        cv2.imshow("Manual Annotation", img_copy)

    # Function that displays a zoomed-in view to help the user click more precisely
    def zoom_click_refinement(img, point, zoom_factor=4, window_size=400):
        x, y = int(point[0]), int(point[1])
        h, w = img.shape[:2]
        half = window_size // 2
        # Crop a window around the click, clamped to the image borders
        x1 = max(x - half, 0)
        y1 = max(y - half, 0)
        x2 = min(x + half, w)
        y2 = min(y + half, h)
        roi = img[y1:y2, x1:x2]
        zoomed = cv2.resize(roi, (roi.shape[1]*zoom_factor, roi.shape[0]*zoom_factor))
        win_name = "Zoomed Refinement"
        cv2.namedWindow(win_name, cv2.WINDOW_NORMAL)
        cv2.imshow(win_name, zoomed)
        refined_point = None

        # Callback function for the zoomed-in refinement window
        def zoom_callback(event, zx, zy, flags, param):
            nonlocal refined_point
            if event == cv2.EVENT_LBUTTONDOWN:
                # Map the click in the magnified crop back to full-image coordinates
                rx = zx / zoom_factor
                ry = zy / zoom_factor
                refined_point = (x1 + rx, y1 + ry)
                cv2.destroyWindow(win_name)

        cv2.setMouseCallback(win_name, zoom_callback)
        while refined_point is None:
            key = cv2.waitKey(1)
            if key == 27:  # Esc cancels refinement
                refined_point = point
                cv2.destroyWindow(win_name)
                break
        return refined_point

    # Mouse callback function to capture clicks using zoomed-in refinement
    def click_event(event, x, y, _flags, _params):
        if event != cv2.EVENT_LBUTTONDOWN:
            return
        # Mouse events keep arriving while the main loop waits for the
        # accept/undo key. Without this guard a stray click would add a fifth
        # point, and accepting afterwards would discard the whole annotation.
        if len(clicked_points) >= required_points:
            print("4 points are already selected; press 'a' to accept or 'u' to undo.")
            return
        initial_point = (x, y)
        refined = zoom_click_refinement(img, initial_point)
        clicked_points.append(refined)
        update_display()
        print(f"Point selected: {refined}")

    cv2.namedWindow("Manual Annotation", cv2.WINDOW_NORMAL)
    cv2.resizeWindow("Manual Annotation", 1280, 720)
    cv2.imshow("Manual Annotation", img_copy)
    cv2.setMouseCallback("Manual Annotation", click_event)

    print("Please click on the 4 outer corners of the chessboard in the following order:")
    print("1. Top-Left")
    print("2. Top-Right")
    print("3. Bottom-Right")
    print("4. Bottom-Left")
    print("Press 'u' to undo the last click. After 4 clicks, press 'a' to accept or 'u' to undo the final click.")

    while True:
        cv2.imshow("Manual Annotation", img_copy)
        key = cv2.waitKey(1) & 0xFF
        if key == ord('u'):
            if clicked_points:
                clicked_points.pop()
                update_display()
                print("Undid the last click.")
        if len(clicked_points) == required_points:
            print("4 points have been selected. Press 'a' to accept these points, or 'u' to undo the final click.")
            # Block until the user decides what to do with the fourth point
            key_confirm = cv2.waitKey(0) & 0xFF
            if key_confirm == ord('a'):
                break
            elif key_confirm == ord('u'):
                if clicked_points:
                    clicked_points.pop()
                    update_display()
                    print("Undid the last click. Please click again.")
        if key == 27:  # Esc key
            print("Manual annotation canceled. Not enough points selected.")
            break

    cv2.destroyWindow("Manual Annotation")

    if len(clicked_points) == required_points:
        return clicked_points
    else:
        return None
    
# Function that interpolates all inner chessboard points from the given outer corners
def interpolate_with_homography(corners, grid_size):
    """Place the interior grid points of a board from its four outer corners.

    A perspective transform is fitted that maps the corners of an ideal
    ``grid_size`` lattice onto the four supplied image points; the whole
    lattice is then pushed through that transform and its border is dropped.

    Args:
        corners: Four image points ordered top-left, top-right, bottom-right,
            bottom-left.
        grid_size: Lattice dimensions as (columns, rows), counted including
            the outermost lines of the board.

    Returns:
        A float32 array of shape ((rows - 2) * (columns - 2), 2) holding the
        interior points row by row, with the column index varying fastest.
    """
    n_cols, n_rows = grid_size
    last_col, last_row = n_cols - 1, n_rows - 1

    # Corners of the ideal lattice, in the same order as the clicked corners
    ideal_corners = np.float32([
        [0, 0],
        [last_col, 0],
        [last_col, last_row],
        [0, last_row],
    ])
    image_corners = np.array(corners, dtype=np.float32)
    homography = cv2.getPerspectiveTransform(ideal_corners, image_corners)

    # Lattice coordinates: entry [i, j] is (j, i), i.e. (x, y) of row i, column j
    col_idx, row_idx = np.meshgrid(
        np.arange(n_cols, dtype=np.float32),
        np.arange(n_rows, dtype=np.float32),
    )
    lattice = np.stack((col_idx, row_idx), axis=-1)

    # perspectiveTransform expects an (N, 1, 2) array of points
    projected = cv2.perspectiveTransform(lattice.reshape(-1, 1, 2), homography)
    projected = projected.reshape(n_rows, n_cols, 2)

    # Strip the first/last row and column to keep only the interior points
    interior = projected[1:-1, 1:-1, :]
    return interior.reshape(-1, 2)

# Function that determines whether the chessboard is placed vertically or horizontally
def determine_grid_size(corners, horizontal_grid_size=11, vertical_grid_size=8):
    """Choose the grid dimensions that match the board's orientation.

    The length of the top edge (corner 0 to corner 1) is compared with the
    length of the left edge (corner 0 to corner 3).

    Args:
        corners: Outer corners ordered top-left, top-right, bottom-right,
            bottom-left; the bottom-right corner is not used.
        horizontal_grid_size: Point count along the board's long side.
        vertical_grid_size: Point count along the board's short side.

    Returns:
        ``(horizontal_grid_size, vertical_grid_size)`` when the top edge is at
        least as long as the left edge, otherwise the two values swapped.
    """
    origin = np.asarray(corners[0], dtype=np.float32)
    top_edge = np.asarray(corners[1], dtype=np.float32) - origin
    left_edge = np.asarray(corners[3], dtype=np.float32) - origin

    if np.linalg.norm(top_edge) < np.linalg.norm(left_edge):
        # Taller than wide: the long side of the board runs vertically
        return (vertical_grid_size, horizontal_grid_size)
    return (horizontal_grid_size, vertical_grid_size)

Process Each Training Image

In [6]:
# Collect object/image point correspondences from every training image:
# automatic detection first, manual four-corner annotation as a fallback.
for idx, fname in enumerate(training_files):
    print(f"\nProcessing image: {fname}")
    img_train = cv2.imread(fname)
    if img_train is None:
        print("Failed to load image.")
        continue
    # Attempt automatic corner detection
    ret, corners = detect_corners_automatically(img_train, pattern_size)

    if ret:
        print("Automatic corner detection succeeded.")
        # Refine corner positions for better accuracy
        criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)
        corners_refined = cv2.cornerSubPix(cv2.cvtColor(img_train, cv2.COLOR_BGR2GRAY), corners, (11, 11), (-1, -1), criteria)

        # Add the refined corners and corresponding object points
        object_points_all.append(objp)
        image_points_all.append(corners_refined)

        # Store these in the automatic lists
        object_points_auto.append(objp)
        image_points_auto.append(corners_refined)

        # Draw the detected corners
        img_auto = img_train.copy()
        cv2.drawChessboardCorners(img_auto, pattern_size, corners_refined, ret)
        cv2.namedWindow("Automatic Corners", cv2.WINDOW_NORMAL)
        cv2.imshow("Automatic Corners", img_auto)
        cv2.waitKey(0)
        cv2.destroyAllWindows()
    else:
        print("Automatic corner detection failed; invoking manual annotation.")
        manual_corners = get_manual_corners(img_train)
        if manual_corners is not None:
            grid_size_manual = determine_grid_size(manual_corners, horizontal_grid_size=11, vertical_grid_size=8)
            corners_manual_full = interpolate_with_homography(manual_corners, grid_size_manual)

            # objp lists the corners with the long board axis (pattern_size[0]
            # points) varying fastest. For a vertically placed board the
            # interpolated points arrive as a tall grid whose short axis varies
            # fastest, so pairing them with objp as-is gives wrong
            # correspondences. Rotating the grid by 90 degrees (a rotation, not
            # a transpose, so the board is not mirrored) restores the ordering
            # that objp expects.
            if grid_size_manual[0] < grid_size_manual[1]:
                inner_rows = grid_size_manual[1] - 2
                inner_cols = grid_size_manual[0] - 2
                inner_grid = corners_manual_full.reshape(inner_rows, inner_cols, 2)
                corners_manual_full = np.ascontiguousarray(np.rot90(inner_grid, 1)).reshape(-1, 2)

            # Add the interpolated corners and corresponding object points
            object_points_all.append(objp)
            image_points_all.append(corners_manual_full)

            # Draw the interpolated corners
            img_with_points = img_train.copy()
            for pt in corners_manual_full:
                x, y = int(pt[0]), int(pt[1])
                cv2.circle(img_with_points, (x, y), 3, (255, 0, 0), -1)
            cv2.namedWindow("Interpolated Points", cv2.WINDOW_NORMAL)
            cv2.resizeWindow("Interpolated Points", 1280, 720)
            cv2.imshow("Interpolated Points", img_with_points)
            cv2.waitKey(0)
            cv2.destroyWindow("Interpolated Points")
        else:
            print("Skipping image since manual annotation is not available.")


Processing image: training_images/WIN_20250211_11_12_06_Pro.jpg
Automatic corner detection succeeded.


2025-02-16 19:35:55.659 python[58723:16866021] +[IMKClient subclass]: chose IMKClient_Modern
2025-02-16 19:35:55.659 python[58723:16866021] +[IMKInputSession subclass]: chose IMKInputSession_Modern



Processing image: training_images/WIN_20250211_10_59_26_Pro.jpg
Automatic corner detection succeeded.

Processing image: training_images/WIN_20250213_09_15_48_Pro.jpg
Automatic corner detection succeeded.

Processing image: training_images/WIN_20250212_12_24_50_Pro.jpg
Automatic corner detection succeeded.

Processing image: training_images/WIN_20250212_12_24_40_Pro.jpg
Automatic corner detection succeeded.

Processing image: training_images/WIN_20250213_09_07_56_Pro.jpg
Automatic corner detection failed; invoking manual annotation.
Please click on the 4 outer corners of the chessboard in the following order:
1. Top-Left
2. Top-Right
3. Bottom-Right
4. Bottom-Left
Press 'u' to undo the last click. After 4 clicks, press 'a' to accept or 'u' to undo the final click.
Point selected: (98.25, 230.25)
Point selected: (1661.0, 193.0)
Point selected: (1357.75, 576.75)
Point selected: (469.0, 605.75)
4 points have been selected. Press 'a' to accept these points, or 'u' to undo the final click.

Process the final test image

In [None]:
# Load the final test image
final_test_file = "final_test.jpg"
img_final = cv2.imread(final_test_file)
if img_final is None:
    print("Error: Could not load final test image.")
else:
    # Grayscale copy, needed for the sub-pixel refinement below
    gray_final = cv2.cvtColor(img_final, cv2.COLOR_BGR2GRAY)

    # Attempt automatic corner detection. The detector's preprocessing performs
    # its own BGR -> gray conversion, so it must receive the colour image;
    # handing it the grayscale copy makes that conversion fail.
    ret, corners_final = detect_corners_automatically(img_final, pattern_size)

    print("Final Test Image - Detection flag (ret):", ret)

    if ret:
        print("Automatic corner detection succeeded on the final test image.")
        # Refine the detected corners for better accuracy
        criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)
        corners_final_refined = cv2.cornerSubPix(gray_final, corners_final, (11, 11), (-1, -1), criteria)

        # Add the refined corners of THIS image and the corresponding object
        # points. (The stale `corners_refined` left over from the training loop
        # belongs to a different image and must not be appended here.)
        object_points_all.append(objp)
        image_points_all.append(corners_final_refined)

        # Also store these in the automatic lists
        object_points_auto.append(objp)
        image_points_auto.append(corners_final_refined)

        # Draw the detected corners on a copy of the final image
        img_final_drawn = img_final.copy()
        cv2.drawChessboardCorners(img_final_drawn, pattern_size, corners_final_refined, ret)

        # Display the final test image with detected corners
        cv2.namedWindow("Final Test Automatic Detection", cv2.WINDOW_NORMAL)
        cv2.imshow("Final Test Automatic Detection", img_final_drawn)
        cv2.waitKey(0)
        cv2.destroyAllWindows()
    else:
        print("Automatic corner detection failed on the final test image. Please check the image conditions.")

Camera Calibration Runs

In [None]:
# Image resolution as (width, height), read off the first training image
img_example = cv2.imread(training_files[0])
img_size = img_example.shape[1::-1]
print("\nImage size (width x height):", img_size)

# Run 1: calibrate on every collected view (automatic and manual)
ret1, cameraMatrix1, distCoeffs1, rvecs1, tvecs1 = cv2.calibrateCamera(
    object_points_all,
    image_points_all,
    img_size,
    None,
    None,
)
print("\nRun 1 Calibration Results (All Images):")
print("Camera Matrix:\n", cameraMatrix1)
print("Distortion Coefficients:\n", distCoeffs1)

# Run 2: calibrate on the first 10 automatically detected views, or on all of
# them when fewer than 10 are available
if len(object_points_auto) < 10:
    print("Not enough automatic images for Run 2; using available automatic images.")
    objpoints_run2, imgpoints_run2 = object_points_auto, image_points_auto
else:
    objpoints_run2, imgpoints_run2 = object_points_auto[:10], image_points_auto[:10]

ret2, cameraMatrix2, distCoeffs2, rvecs2, tvecs2 = cv2.calibrateCamera(
    objpoints_run2,
    imgpoints_run2,
    img_size,
    None,
    None,
)
print("\nRun 2 Calibration Results (10 Automatic Images):")
print("Camera Matrix:\n", cameraMatrix2)
print("Distortion Coefficients:\n", distCoeffs2)

# Run 3: calibrate on the first 5 views of the Run 2 selection, or on the
# whole selection when it holds fewer than 5
if len(objpoints_run2) < 5:
    print("Not enough images for Run 3; using available images from Run 2.")
    objpoints_run3, imgpoints_run3 = objpoints_run2, imgpoints_run2
else:
    objpoints_run3, imgpoints_run3 = objpoints_run2[:5], imgpoints_run2[:5]

ret3, cameraMatrix3, distCoeffs3, rvecs3, tvecs3 = cv2.calibrateCamera(
    objpoints_run3,
    imgpoints_run3,
    img_size,
    None,
    None,
)
print("\nRun 3 Calibration Results (5 Automatic Images):")
print("Camera Matrix:\n", cameraMatrix3)
print("Distortion Coefficients:\n", distCoeffs3)

Testing the calibration (will take out when submitting)

In [None]:
# (Run after the calibration runs.)
# Visual sanity check: project the board's coordinate axes into one of the
# calibration views using the pose estimated for that view in Run 1.

# Index of the view to inspect. The same index selects the image file, the
# pose (rvecs1 / tvecs1) and the detected corners, so keep it in one place.
# NOTE(review): image_points_all / rvecs1 only contain views that were actually
# used, so if any earlier training image was skipped, training_files[sample_idx]
# is not the image this pose belongs to - confirm before trusting the overlay.
sample_idx = 4

img = cv2.imread(training_files[sample_idx])
if img is None:
    print("Error: Could not load the training image for overlay.")
    # exit() is an interactive helper from the site module and shuts down a
    # notebook kernel; raising SystemExit stops execution without relying on it.
    raise SystemExit(1)

# Define 3D points for coordinate axes (length = 3 squares, for example).
# Negative Z is used for the third axis, matching the cube drawn elsewhere.
axis = np.float32([[3*square_size, 0, 0],
                   [0, 3*square_size, 0],
                   [0, 0, -3*square_size]]).reshape(-1, 3)

# Project the 3D axis end points to the image plane using the pose of the
# selected calibration view from Run 1.
imgpts, _ = cv2.projectPoints(axis, rvecs1[sample_idx], tvecs1[sample_idx], cameraMatrix1, distCoeffs1)

# Use the first detected chessboard corner of that view as the axes' origin,
# converted to integer pixel coordinates.
corner = tuple(map(int, image_points_all[sample_idx][0].ravel()))

# Convert the projected axis points to integer coordinates.
x_axis = tuple(map(int, imgpts[0].ravel()))
y_axis = tuple(map(int, imgpts[1].ravel()))
z_axis = tuple(map(int, imgpts[2].ravel()))

# Copy the image for drawing the axes.
img_axes = img.copy()
img_axes = cv2.line(img_axes, corner, x_axis, (255, 0, 0), 5)  # X-axis in blue
img_axes = cv2.line(img_axes, corner, y_axis, (0, 255, 0), 5)  # Y-axis in green
img_axes = cv2.line(img_axes, corner, z_axis, (0, 0, 255), 5)  # Z-axis in red

cv2.namedWindow("3D Axes Overlay", cv2.WINDOW_NORMAL)
cv2.imshow("3D Axes Overlay", img_axes)
cv2.waitKey(0)
cv2.destroyAllWindows()

Online Phase

In [None]:
# Function to calculate color based on position and orientation
def calculate_hsv_color(rvec, tvec, top_plane_normal=(0, 0, 1), units_per_meter=1000.0):
    """Encode a board pose as a single OpenCV 8-bit HSV colour.

    * Value: 255 at the camera, falling linearly to 0 at 4 m distance.
    * Saturation: 255 when the rotated normal is aligned with the camera's
      Z axis, falling linearly to 0 at 45 degrees.
    * Hue: derived from the horizontal bearing ``atan2(tx, tz)`` of the board.

    Args:
        rvec: Rotation vector of the board pose (as accepted by cv2.Rodrigues).
        tvec: Translation vector of the board pose; any shape with at least
            three elements, read as (tx, ty, tz).
        top_plane_normal: Plane normal expressed in board coordinates.
        units_per_meter: Number of ``tvec`` units in one metre. The object
            points in this file are built from a square size given in mm, so
            the default converts millimetres to metres.

    Returns:
        A uint8 array of shape (1, 1, 3) holding (H, S, V), suitable for
        ``cv2.cvtColor(..., cv2.COLOR_HSV2BGR)``.
    """
    translation = np.asarray(tvec, dtype=np.float64).ravel()

    # Distance to camera (for intensity/value). Convert to metres first:
    # without the conversion a millimetre-scale tvec always yields value 0.
    distance_m = np.linalg.norm(translation) / units_per_meter
    value = float(np.clip(255 * (1 - distance_m / 4), 0, 255))  # 0-4 m -> 255-0

    # Angle between the camera's Z axis and the rotated plane normal (for saturation)
    R, _ = cv2.Rodrigues(rvec)
    transformed_normal = R.dot(np.asarray(top_plane_normal, dtype=np.float64))
    # Rounding can push the cosine marginally outside [-1, 1]; clip to avoid NaN
    cos_angle = np.clip(transformed_normal[2], -1.0, 1.0)
    angle = np.degrees(np.arccos(cos_angle))
    saturation = float(np.clip(255 * (1 - angle / 45), 0, 255))  # 0-45 deg -> 255-0

    # Hue from the horizontal position. The bearing spans 0-360 degrees, but an
    # 8-bit OpenCV hue covers 0-179 (degrees / 2); storing the raw degrees in a
    # uint8 would overflow and produce the wrong colour.
    bearing_deg = np.degrees(np.arctan2(translation[0], translation[2])) + 180.0
    hue = (bearing_deg / 2.0) % 180

    return np.array([[[hue, saturation, value]]]).astype(np.uint8)


# Function to draw cube and axes
def draw_cube_and_axes(img, rvec, tvec, camera_matrix, dist_coeffs, square_size):
    """Overlay the board's coordinate axes and a wireframe cube on *img*.

    The axes are three squares long and the cube two squares per edge; both
    start at the board origin and extend towards negative Z. The cube's upper
    face is filled with the colour returned by ``calculate_hsv_color`` for the
    given pose.

    Args:
        img: BGR image to draw on.
        rvec: Rotation vector of the board pose.
        tvec: Translation vector of the board pose.
        camera_matrix: Camera intrinsic matrix.
        dist_coeffs: Lens distortion coefficients.
        square_size: Edge length of one chessboard square.

    Returns:
        The image with the overlay drawn.
    """
    axis_len = 3 * square_size
    edge = 2 * square_size

    # Model-space geometry: origin plus the three axis tips, then the cube's
    # four base corners (Z = 0) followed by its four upper corners (Z = -edge)
    axis_model = np.float32([
        [0, 0, 0],
        [axis_len, 0, 0],
        [0, axis_len, 0],
        [0, 0, -axis_len],
    ])
    footprint = [(0, 0), (edge, 0), (edge, edge), (0, edge)]
    cube_model = np.float32(
        [[px, py, 0] for px, py in footprint]
        + [[px, py, -edge] for px, py in footprint]
    )

    # Project both point sets into the image
    axis_proj, _ = cv2.projectPoints(axis_model, rvec, tvec, camera_matrix, dist_coeffs)
    cube_proj, _ = cv2.projectPoints(cube_model, rvec, tvec, camera_matrix, dist_coeffs)

    # Axes: X in blue, Y in green, Z in red (BGR colour tuples)
    axis_px = [tuple(map(int, point.ravel())) for point in axis_proj[:4]]
    start = axis_px[0]
    axis_colours = ((255, 0, 0), (0, 255, 0), (0, 0, 255))
    for tip, colour in zip(axis_px[1:], axis_colours):
        img = cv2.line(img, start, tip, colour, 3)

    # Cube wireframe: base outline, upper outline, then the four uprights
    cube_px = np.int32(cube_proj).reshape(-1, 2)
    base_face = cube_px[:4]
    upper_face = cube_px[4:]
    wire_colour = (0, 255, 0)
    img = cv2.drawContours(img, [base_face], -1, wire_colour, 3)
    img = cv2.drawContours(img, [upper_face], -1, wire_colour, 3)
    for lower_pt, upper_pt in zip(base_face, upper_face):
        img = cv2.line(img, tuple(lower_pt), tuple(upper_pt), wire_colour, 3)

    # Fill the upper face with the pose-dependent colour
    pose_hsv = calculate_hsv_color(rvec, tvec)
    pose_bgr = cv2.cvtColor(pose_hsv, cv2.COLOR_HSV2BGR).squeeze()
    cv2.fillConvexPoly(img, upper_face.reshape((-1, 1, 2)), pose_bgr.tolist())

    return img


# Process test image with all three calibration results
test_img = cv2.imread("final_test.jpg")
if test_img is None:
    # imread returns None instead of raising when the file cannot be read
    print("Error: Could not load final test image.")
else:
    # Grayscale copy, needed for the sub-pixel refinement below
    gray_test = cv2.cvtColor(test_img, cv2.COLOR_BGR2GRAY)

    # The detector's preprocessing performs its own BGR -> gray conversion, so
    # it must receive the colour image rather than the grayscale copy.
    ret, corners = detect_corners_automatically(test_img, pattern_size)

    if ret:
        criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)
        corners = cv2.cornerSubPix(gray_test, corners, (11, 11), (-1, -1), criteria)

        # Process with each calibration result
        for run, (camera_matrix, dist_coeffs) in enumerate([
            (cameraMatrix1, distCoeffs1),
            (cameraMatrix2, distCoeffs2),
            (cameraMatrix3, distCoeffs3)
        ], 1):
            # Find the board pose for this set of intrinsics
            pose_found, rvec, tvec = cv2.solvePnP(objp, corners, camera_matrix, dist_coeffs)
            if not pose_found:
                # Drawing with an invalid pose would produce a meaningless overlay
                print(f"Run {run}: pose estimation failed; skipping overlay.")
                continue

            # Draw results
            img_result = test_img.copy()
            img_result = draw_cube_and_axes(img_result, rvec, tvec, camera_matrix, dist_coeffs, square_size)

            # Display result
            cv2.namedWindow(f"Run {run} Result", cv2.WINDOW_NORMAL)
            cv2.imshow(f"Run {run} Result", img_result)
            cv2.waitKey(0)

        cv2.destroyAllWindows()
    else:
        print("Could not detect corners in test image automatically")
