📜 Gate 3: The Hall of Convergence¶
You now stand before the Third Gate, known as the Hall of Convergence.
Here, the fractured shards of vision must be brought back together into a single whole.
The walls of this hall shimmer with fragments of broken images, floating and misaligned — waiting for your hand to restore them.
👁️ The Archivist’s Words¶
You have already passed through the Gates of Inversion and Recognition.
You have learned to return fragments to their true form and to reveal hidden correspondences through the Algorithms of Sight. But now, Visioneer, comes the trial of Convergence.
🔑 Your Task¶
You are given:
- Region 1 (ref_plane_img) — the unbroken fragment, the sacred base plane.
- Regions 2, 3, and 4 (warped_region_1.png, warped_region_2.png, warped_region_3.png) — shards that have been restored from distortion, but remain displaced.
- Their Homographies — the secret maps of alignment.
Your mission:
- Warp each shard into the plane of Region 1 using the given homographies.
- Stitch them into a single canvas, reconstructing the hidden whole.
- Ensure that Region 1 remains the base foundation, unaltered and true.
⚠️ The Archivist’s Warning¶
Beware, Visioneer.
Many attempt to cheat, letting false algorithms do the work.
But this Gate tests your mastery, not your shortcuts. The careless will summon only chaos — broken seams, misaligned truths, or blank voids.
Only by true effort will you restore the Vision.
🎯 Goal¶
Pass through the Hall of Convergence, and you will emerge not as an apprentice but as a Weaver of Worlds — one who can take the scattered and make it whole.
## Importing recipes
%matplotlib inline
import cv2
import numpy as np
import matplotlib.pyplot as plt
import os
from google.colab import drive
# Mounting google drive
drive.mount('/content/drive')
def display_images_in_row(images, cmap='gray'):
    fig, axs = plt.subplots(1, len(images), figsize=(5 * len(images), 5))
    if len(images) == 1:
        axs = [axs]
    for ax, img in zip(axs, images):
        ax.imshow(img, cmap=cmap)
        ax.axis('off')
    plt.tight_layout()
    plt.show()
base_dir = "/content/drive/MyDrive/ES666CV/images/C"  # Base directory containing I1, I2, ..., I5
all_images = []  # List to store the input images

for dataset in sorted(os.listdir(base_dir)):
    dataset_path = os.path.join(base_dir, dataset)
    if not os.path.isdir(dataset_path):
        continue

    # Reference image (Region 1)
    ref_img_path = os.path.join(dataset_path, "ref_plane_img.png")
    ref_img = cv2.imread(ref_img_path)
    ref_img = cv2.cvtColor(ref_img, cv2.COLOR_BGR2RGB)

    # List to store the input images for this dataset
    images = [ref_img]

    # Loop through warped regions 2, 3, 4
    for i in range(2, 5):
        warped_img_path = os.path.join(dataset_path, f"warped_region_{i}.png")
        # Load the warped (still displaced) image for display; restoration happens later
        warped_img = cv2.imread(warped_img_path)
        warped_img = cv2.cvtColor(warped_img, cv2.COLOR_BGR2RGB)
        images.append(warped_img)

    # Add the input images for this dataset to the main list
    all_images.append(images)
for idx, imgs in enumerate(all_images):
    print(f"\nDisplaying input images for I{idx+1}: Reference Plane Image, Warped Regions 2, 3 and 4")
    display_images_in_row(imgs, cmap=None)
Task 1: Implement Inverse Warping from scratch (4 marks)¶
Instructions:
- Implement warpPerspective_from_scratch(img, H, output_shape) to warp the input image img to a new plane. The homography H maps coordinates in the source image to the target plane, and output_shape defines the size (height, width) of the output.
- Implement restore_images_in_reference_plane(img, H, output_shape) to map a warped image img back to the reference plane using the inverse of H. Here, H is the homography that originally mapped the reference plane to the warped image.
Homography Mapping:¶
A homography $H$ maps points $(x, y)$ in the source image to points $(x', y')$ in the target plane:
$$ \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} = H \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} $$
Here, $H$ is a $3 \times 3$ matrix representing a projective transformation.
Inverse Warping Principle:
To compute the value of a pixel in the target image, we perform inverse mapping:
$$ \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} = H^{-1} \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} $$
- $H^{-1}$ maps a pixel in the target plane back to its corresponding location in the source image.
- This ensures that every target pixel is assigned a valid value from the source, avoiding holes.
Bilinear Interpolation:
Since the mapped source coordinates $(x, y)$ are generally non-integer, we use bilinear interpolation to compute pixel values:
$$ I(x', y') = (1 - \delta_x)(1 - \delta_y) I(x_0, y_0) + \delta_x (1 - \delta_y) I(x_1, y_0) + (1 - \delta_x) \delta_y I(x_0, y_1) + \delta_x \delta_y I(x_1, y_1) $$
Where:
- $(x_0, y_0), (x_1, y_1)$ are the four integer neighbors of $(x, y)$
- $\delta_x = x - x_0$, $\delta_y = y - y_0$
This produces smooth pixel values when mapping to the reference plane.
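For example, with $\delta_x = 0.3$, $\delta_y = 0.7$ and neighbor intensities $I(x_0, y_0) = 10$, $I(x_1, y_0) = 20$, $I(x_0, y_1) = 30$, $I(x_1, y_1) = 40$ (illustrative values, not assignment data), the interpolated value is $0.21 \cdot 10 + 0.09 \cdot 20 + 0.49 \cdot 30 + 0.21 \cdot 40 = 27$.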
def warpPerspective_from_scratch(img, H, output_shape):
    """
    Inverse warp an image using a given homography matrix H.
    Parameters:
        img : np.array
            Input image to be warped.
        H : np.array
            Homography matrix mapping source -> target plane.
        output_shape : tuple
            (height, width) of the target image.
    Returns:
        restored : np.array
            The warped image of shape output_shape.
    """
    h, w = output_shape
    restored = np.zeros((h, w, img.shape[2]), dtype=img.dtype)

    # Precompute inverse for mapping from output plane to input plane
    H_inv = np.linalg.inv(H)

    for y_out in range(h):
        for x_out in range(w):
            # Create homogeneous coordinates for the output pixel
            out_coords = np.array([x_out, y_out, 1])
            # Map back to input image using inverse homography
            src_coords = H_inv @ out_coords
            src_coords /= src_coords[2]  # Normalize
            x_src, y_src = src_coords[0], src_coords[1]

            # Check if the source coordinates are inside the input image
            if 0 <= x_src <= img.shape[1] - 1 and 0 <= y_src <= img.shape[0] - 1:
                # Bilinear interpolation
                x0, y0 = int(np.floor(x_src)), int(np.floor(y_src))
                x1, y1 = min(x0 + 1, img.shape[1] - 1), min(y0 + 1, img.shape[0] - 1)
                dx, dy = x_src - x0, y_src - y0
                for c in range(img.shape[2]):
                    val = (img[y0, x0, c] * (1 - dx) * (1 - dy) +
                           img[y0, x1, c] * dx * (1 - dy) +
                           img[y1, x0, c] * (1 - dx) * dy +
                           img[y1, x1, c] * dx * dy)
                    restored[y_out, x_out, c] = val
    return restored
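A quick sanity check can catch indexing mistakes early. The snippet below is an illustrative addition (not part of the original assignment): warping a random test image with the identity homography should return it unchanged.

# Illustrative sanity check (hypothetical test image, not assignment data):
# the identity homography should reproduce the input exactly.
test_img = np.random.randint(0, 256, (32, 48, 3), dtype=np.uint8)
identity_out = warpPerspective_from_scratch(test_img, np.eye(3), test_img.shape[:2])
assert np.array_equal(identity_out, test_img)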
def restore_images_in_reference_plane(img, H, output_shape):
    """
    Restore a warped image back to the reference plane using inverse homography.
    Parameters:
        img : np.array
            Warped image to be restored.
        H : np.array
            Homography matrix mapping reference -> warped plane.
        output_shape : tuple
            (height, width) of the reference plane.
    Returns:
        warped : np.array
            Restored image in the reference plane.
    """
    h_out, w_out = output_shape
    ## TODO: Compute H inverse: H_inv
    ## TODO: For each pixel in the output (reference) plane, compute the corresponding
    ##       pixel location in the warped image using H_inv.
    H_inv = np.linalg.inv(H)
    # Use the warpPerspective function with the inverse homography
    warped = warpPerspective_from_scratch(img, H_inv, output_shape)
    return warped
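As another illustrative check (not part of the original assignment), a pure-translation homography makes it easy to verify the two functions together: warp a test image into a shifted plane, restore it, and compare the interior region that stays inside the frame.

# Hedged round-trip check with a hypothetical test image and a pure translation H
H_shift = np.array([[1.0, 0.0, 5.0],
                    [0.0, 1.0, 3.0],
                    [0.0, 0.0, 1.0]])  # reference -> warped: shift by (+5, +3)
orig = np.random.randint(0, 256, (40, 60, 3), dtype=np.uint8)
shifted = warpPerspective_from_scratch(orig, H_shift, orig.shape[:2])
recovered = restore_images_in_reference_plane(shifted, H_shift, orig.shape[:2])
# Pixels shifted out of the frame are lost, so compare only the surviving interior
assert np.array_equal(recovered[:-3, :-5], orig[:-3, :-5])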
restored_all = []  # List to store restored images

for dataset in sorted(os.listdir(base_dir)):
    dataset_path = os.path.join(base_dir, dataset)
    if not os.path.isdir(dataset_path):
        continue
    print(f"\nProcessing dataset: {dataset}")

    # Reference image to get output size
    ref_img_path = os.path.join(dataset_path, "ref_plane_img.png")
    ref_img = cv2.imread(ref_img_path)
    ref_img = cv2.cvtColor(ref_img, cv2.COLOR_BGR2RGB)
    h_out, w_out = ref_img.shape[:2]

    # Directory containing homography matrices
    homography_dir = os.path.join(dataset_path, "homographies")

    # List to store restored images for this dataset
    restored_dataset = [ref_img]

    # Loop through warped regions 2, 3, 4
    for i in range(2, 5):
        warped_img_path = os.path.join(dataset_path, f"warped_region_{i}.png")
        H_path = os.path.join(homography_dir, f"H_region_{i}.txt")

        # Load image and homography
        warped_img = cv2.imread(warped_img_path)
        warped_img = cv2.cvtColor(warped_img, cv2.COLOR_BGR2RGB)
        H = np.loadtxt(H_path)

        # Inverse warp
        restored_img = restore_images_in_reference_plane(warped_img, H, (h_out, w_out))
        restored_dataset.append(restored_img)

        # save restored image
        # output_dir = os.path.join(dataset_path, "restored")
        # os.makedirs(output_dir, exist_ok=True)
        # save_path = os.path.join(output_dir, f"restored_warped_region_{i}.png")
        # cv2.imwrite(save_path, restored_img)
        # print(f"Saved: {save_path}")

    # Add restored images for this dataset to the main list
    restored_all.append(restored_dataset)
for idx, imgs in enumerate(restored_all):
    print(f"\nDisplaying restored images for I{idx+1}:")
    display_images_in_row(imgs, cmap=None)
Displaying restored images for I1:
Displaying restored images for I2:
Displaying restored images for I3:
Displaying restored images for I4:
Displaying restored images for I5:
📖 Theory Question: Explain the difference between forward warping and inverse warping. Why is inverse warping generally preferred?
Forward Warping vs Inverse Warping¶
When transforming an image using a homography matrix $H$, we aim to map pixels between two coordinate systems — typically between a source image and a destination (target) plane.
In homogeneous coordinates, a pixel $(x, y)$ in the source image is mapped to $(x', y')$ in the destination plane as:
$$ \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} = H \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} $$
Here:
- $(x, y)$ are coordinates in the source image.
- $(x', y')$ are the corresponding coordinates in the destination image.
- $H$ is the $3 \times 3$ homography matrix that maps one plane to another.
Forward Warping¶
In forward warping, each pixel from the source image is projected onto its new location in the destination image using:
$$ \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} = H \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} $$
We then place the pixel value from $(x, y)$ into the position $(x', y')$ in the output image.
Problems with Forward Warping:¶
- Holes (Unassigned Pixels) — Some pixels in the destination image might not be hit by any source pixel, leading to gaps or black spots.
- Overlaps (Multiple Assignments) — Multiple source pixels may map to the same destination pixel.
- Difficult Interpolation — We don’t know easily which destination pixels correspond to valid source pixels, making it hard to fill the missing areas.
Hence, while conceptually straightforward, forward warping produces non-uniform and incomplete results.
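To make the contrast concrete, here is a minimal forward-warping sketch (an illustration added here, not part of the assignment starter code). Each source pixel is pushed to its projected location and rounded to the nearest destination pixel, which is exactly what produces holes and overwrites.

def forward_warp_naive(img, H, output_shape):
    """Naive forward warping: push each source pixel to its projected location.
    Rounding to the nearest destination pixel leaves holes and silently overwrites."""
    h_out, w_out = output_shape
    out = np.zeros((h_out, w_out, img.shape[2]), dtype=img.dtype)
    for y in range(img.shape[0]):
        for x in range(img.shape[1]):
            p = H @ np.array([x, y, 1.0])
            x_dst, y_dst = int(round(p[0] / p[2])), int(round(p[1] / p[2]))
            if 0 <= x_dst < w_out and 0 <= y_dst < h_out:
                out[y_dst, x_dst] = img[y, x]  # destination pixels hit twice are overwritten
    return out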
Inverse Warping¶
In inverse warping, we iterate over each pixel in the destination image, and find where it came from in the source image using the inverse homography:
$$ \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} = H^{-1} \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} $$
Then, we sample the intensity at $(x, y)$ from the source image (using nearest-neighbor or bilinear interpolation) and assign it to the destination pixel $(x', y')$.
Advantages of Inverse Warping:¶
- No Holes — Every pixel in the destination gets a value.
- Smooth Sampling — We can use interpolation to get sub-pixel accuracy.
- Stable and Deterministic — Each output pixel is assigned exactly once.
Task 2: Keypoint Detection and Homography Estimation (4 marks)¶
Instructions:
Detect keypoints and compute descriptors for each image using SIFT. Then, match keypoints between each restored region and the reference image. You may use OpenCV functions for both detecting SIFT keypoints and matching descriptors.
Implement homography estimation using RANSAC from scratch. Do not use OpenCV’s findHomography for this step. Compute the homography matrix that aligns each region to the reference plane.
Keypoint Detection and Homography Estimation¶
1. Keypoint Detection and Descriptors:
- SIFT (Scale-Invariant Feature Transform) detects distinctive keypoints in an image.
- Each keypoint has a descriptor vector $\mathbf{d} \in \mathbb{R}^{128}$ that encodes local gradient information, invariant to scale and rotation.
2. Matching Keypoints:
- Given descriptors $\mathbf{d}_i$ from the source image and $\mathbf{d}_j$ from the target image, nearest neighbor matching is performed:
$$ \text{match}(\mathbf{d}_i) = \arg\min_j \|\mathbf{d}_i - \mathbf{d}_j\|_2 $$
- The ratio test filters ambiguous matches to reduce outliers.
3. Homography Estimation (DLT):
- A homography $H$ maps points $\mathbf{p}_i = [x_i, y_i, 1]^T$ in the source image to points $\mathbf{p}'_i = [x'_i, y'_i, 1]^T$ in the target image:
$$ \mathbf{p}'_i = H \mathbf{p}_i $$
- For $N \geq 4$ matched points, we solve the Direct Linear Transform (DLT) linear system:
$$ A \mathbf{h} = 0 $$
where $\mathbf{h}$ is the vectorized homography $H$.
- Normalization improves numerical stability by translating and scaling points so their centroid is at the origin and their average distance from it is $\sqrt{2}$ (see the sketch after this list).
4. RANSAC for Robust Estimation:
- Randomly select 4 correspondences to compute a candidate homography $H$.
- Compute the reprojection error for all points:
$$ e_i = \|\mathbf{p}'_i - H \mathbf{p}_i\|_2 $$
- Points with $e_i < \text{threshold}$ are inliers.
- Repeat for many iterations and select $H$ with the maximum inliers.
- Finally, recompute $H$ using all inliers for a robust estimate.
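For concreteness, here is a minimal sketch of the normalized DLT described in step 3 (the helper name compute_homography_dlt is ours, not part of the provided starter code). It builds the $A \mathbf{h} = 0$ system from $N \geq 4$ correspondences and solves it with the SVD.

def compute_homography_dlt(pts_src, pts_dst):
    """Estimate H from >= 4 correspondences using the normalized DLT.
    pts_src, pts_dst: (N, 2) arrays of matched (x, y) coordinates."""
    def normalize(pts):
        # Translate the centroid to the origin and scale so the mean distance is sqrt(2)
        centroid = pts.mean(axis=0)
        scale = np.sqrt(2) / np.mean(np.linalg.norm(pts - centroid, axis=1))
        T = np.array([[scale, 0, -scale * centroid[0]],
                      [0, scale, -scale * centroid[1]],
                      [0, 0, 1]])
        pts_h = np.hstack([pts, np.ones((len(pts), 1))])
        return (T @ pts_h.T).T, T

    src_n, T_src = normalize(np.asarray(pts_src, dtype=np.float64))
    dst_n, T_dst = normalize(np.asarray(pts_dst, dtype=np.float64))

    # Build the 2N x 9 DLT matrix A such that A h = 0
    A = []
    for (x, y, _), (xp, yp, _) in zip(src_n, dst_n):
        A.append([-x, -y, -1, 0, 0, 0, xp * x, xp * y, xp])
        A.append([0, 0, 0, -x, -y, -1, yp * x, yp * y, yp])
    A = np.array(A)

    # h is the right singular vector associated with the smallest singular value
    _, _, Vt = np.linalg.svd(A)
    H_norm = Vt[-1].reshape(3, 3)

    # Undo the normalization and fix the scale so H[2, 2] = 1
    H = np.linalg.inv(T_dst) @ H_norm @ T_src
    return H / H[2, 2]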
def detect_keypoints_sift(img):
    """
    Detect keypoints and compute descriptors using SIFT.
    Parameters:
        img : np.array
            Input image in which keypoints are to be detected.
    Returns:
        keypoints : list
            Detected keypoints in the image.
        descriptors : np.array
            Feature descriptors corresponding to the keypoints.
    """
    ## TODO: Convert image to grayscale
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    ## TODO: Detect SIFT keypoints
    sift = cv2.SIFT_create()
    ## TODO: Compute descriptors for the keypoints
    keypoints, descriptors = sift.detectAndCompute(gray, None)
    return keypoints, descriptors
def match_keypoints(des1, des2, ratio_thresh=0.75):
    """
    Match descriptors between two images using nearest neighbor and ratio test.
    Parameters:
        des1 : np.array
            Descriptors from the first image.
        des2 : np.array
            Descriptors from the second image.
        ratio_thresh : float
            Ratio threshold for filtering ambiguous matches.
    Returns:
        good_matches : list
            List of filtered good matches passing the ratio test.
    """
    ## TODO: Match descriptors using nearest neighbor (Using OpenCV)
    bf = cv2.BFMatcher(cv2.NORM_L2, crossCheck=False)
    matches = bf.knnMatch(des1, des2, k=2)
    ## TODO: Apply ratio test to filter matches
    good_matches = []
    for m, n in matches:
        if m.distance < ratio_thresh * n.distance:
            good_matches.append(m)
    return good_matches
def compute_homography_ransac(kp1, kp2, matches, iterations=1000, threshold=5):
    """
    Compute homography using matched keypoints and RANSAC.
    Parameters:
        kp1 : list
            Keypoints from the first image.
        kp2 : list
            Keypoints from the second image.
        matches : list
            Matches between keypoints of the two images.
        iterations : int
            Number of RANSAC iterations.
        threshold : float
            Distance threshold to classify inliers.
    Returns:
        H : np.array
            Estimated homography matrix mapping kp1 -> kp2.
    """
    ## TODO: Implement RANSAC to find the best homography
    ## TODO: Convert keypoints to coordinates
    ## TODO: Iteratively estimate H and count inliers

    # Convert matched keypoints to NumPy coordinate arrays once
    pts1 = np.float32([kp1[m.queryIdx].pt for m in matches])
    pts2 = np.float32([kp2[m.trainIdx].pt for m in matches])

    n_points = len(matches)
    if n_points < 4:
        raise ValueError("Not enough matches to compute homography")

    max_inliers = 0
    best_H = None

    for _ in range(iterations):
        # Randomly choose 4 correspondences and fit a candidate homography
        idx = np.random.choice(n_points, 4, replace=False)
        H = cv2.getPerspectiveTransform(pts1[idx], pts2[idx])

        # Reprojection error of all correspondences under the candidate H
        pts1_transformed = cv2.perspectiveTransform(pts1.reshape(-1, 1, 2), H)
        distances = np.linalg.norm(pts1_transformed.reshape(-1, 2) - pts2, axis=1)
        inliers = np.sum(distances < threshold)

        # Keep the candidate with the most inliers
        if inliers > max_inliers:
            max_inliers = inliers
            best_H = H
    return best_H
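The theory above also calls for a final re-estimate of $H$ from all inliers of the best model, which the loop above does not perform. A minimal hedged sketch of that refinement step, assuming pts1, pts2, best_H and threshold from the function and the compute_homography_dlt helper sketched earlier, could be run after the RANSAC loop:

# Optional refinement sketch (assumes pts1, pts2, best_H, threshold as above):
# refit the homography on all inliers of the best RANSAC hypothesis.
proj = cv2.perspectiveTransform(pts1.reshape(-1, 1, 2), best_H).reshape(-1, 2)
inlier_mask = np.linalg.norm(proj - pts2, axis=1) < threshold
if inlier_mask.sum() >= 4:
    best_H = compute_homography_dlt(pts1[inlier_mask], pts2[inlier_mask])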
homographies_all = []  # nested list: [dataset][region_index] -> H

for dataset_idx, dataset_images in enumerate(restored_all):
    print(f"\nProcessing dataset {dataset_idx+1}")
    homographies_dataset = []

    # Use the reference image as base (region 1 is at index 0)
    ref_img = dataset_images[0]
    kp_ref, des_ref = detect_keypoints_sift(ref_img)

    # Compute homography for each of the other restored regions
    for region_idx in range(1, len(dataset_images)):
        img = dataset_images[region_idx]
        kp, des = detect_keypoints_sift(img)
        matches = match_keypoints(des, des_ref)
        H = compute_homography_ransac(kp, kp_ref, matches)
        homographies_dataset.append(H)
        print(f"Dataset {dataset_idx+1}, Region {region_idx+1} Homography:\n", H)

        # Visualize matches
        img_matches = cv2.drawMatches(img, kp, ref_img, kp_ref, matches[:30], None, flags=2)
        plt.figure(figsize=(12, 6))
        plt.imshow(img_matches)
        plt.axis('off')
        plt.show()

    homographies_all.append(homographies_dataset)
Processing dataset 1
Dataset 1, Region 2 Homography:
[[ 1.00748986e+00 7.64714288e-04 1.61247080e+03] [ 2.80265892e-03 1.00305069e+00 -2.12369959e+00] [ 2.86266790e-06 3.65196744e-07 1.00000000e+00]]
Dataset 1, Region 3 Homography: [[ 1.00356157e+00 -3.94564416e-03 -1.50509922e+00] [ 1.55809657e-03 9.99014080e-01 1.20998482e+03] [ 1.53620479e-06 -1.62282524e-06 1.00000000e+00]]
Dataset 1, Region 4 Homography: [[1.00316123e+00 5.60358195e-03 1.61233672e+03] [2.06421531e-03 1.00538736e+00 1.20944498e+03] [9.41852280e-07 2.22981271e-06 1.00000000e+00]]
Processing dataset 2
Dataset 2, Region 2 Homography:
[[ 1.00037108e+00 -7.31640591e-04 8.00052389e+02] [-1.76493843e-04 9.99454729e-01 1.95406314e-01] [ 6.10369344e-07 -7.35597017e-07 1.00000000e+00]]
Dataset 2, Region 3 Homography: [[ 1.01877685e+00 -2.01013263e-02 -2.29758923e+00] [ 1.19151436e-02 9.96221084e-01 5.29100076e+02] [ 1.56894586e-05 -2.33424897e-05 1.00000000e+00]]
Dataset 2, Region 4 Homography: [[1.00979133e+00 6.31894281e-03 7.99856608e+02] [4.56404705e-03 1.00708588e+00 5.31874268e+02] [7.30161843e-06 8.64121916e-06 1.00000000e+00]]
Processing dataset 3
Dataset 3, Region 2 Homography:
[[ 1.00076051e+00 -1.45010232e-02 4.12265358e+02] [ 1.74575328e-02 9.96119613e-01 -2.54675957e+00] [ 2.06006965e-05 -2.19985703e-05 1.00000000e+00]]
Dataset 3, Region 3 Homography: [[ 9.84491443e-01 8.58495826e-03 2.07376323e+00] [-1.02998382e-02 9.98684631e-01 2.74083388e+02] [-2.76402692e-05 3.21945092e-05 1.00000000e+00]]
Dataset 3, Region 4 Homography: [[ 7.43614063e-01 1.49346032e+00 3.96188687e+02] [-1.94324008e-01 1.85259519e+00 2.71562709e+02] [-5.83896062e-04 2.55050968e-03 1.00000000e+00]]
Processing dataset 4
Dataset 4, Region 2 Homography:
[[ 9.88534742e-01 -1.30693390e-02 1.30749939e+03] [-2.86291313e-03 9.84518744e-01 7.25295446e+00] [-2.77311013e-06 -8.68913216e-06 1.00000000e+00]]
Dataset 4, Region 3 Homography: [[ 1.00018833e+00 1.81438081e-03 -1.35675484e-01] [-2.45809616e-04 1.00056098e+00 9.80012130e+02] [-3.99044266e-07 7.58490245e-07 1.00000000e+00]]
Dataset 4, Region 4 Homography: [[ 9.95123182e-01 -2.28978038e-02 1.30586172e+03] [-3.41800558e-03 9.75132587e-01 9.81559306e+02] [-2.15236762e-06 -1.61907900e-05 1.00000000e+00]]
Processing dataset 5
Dataset 5, Region 2 Homography:
[[ 9.70381746e-01 -3.76849249e-03 8.00712606e+02] [-1.50105159e-02 9.91800895e-01 3.17009665e+00] [-2.16987084e-05 -5.57718265e-06 1.00000000e+00]]
Dataset 5, Region 3 Homography: [[ 9.91841682e-01 -7.26360773e-03 4.53042541e+00] [-2.72889546e-03 9.88931960e-01 6.01110799e+02] [-2.74223858e-06 -8.18955715e-06 1.00000000e+00]]
Dataset 5, Region 4 Homography: [[ 9.72587854e-01 1.21346935e-02 8.00734422e+02] [-1.75528764e-02 1.00651468e+00 6.00341767e+02] [-2.36251140e-05 1.19701164e-05 1.00000000e+00]]
📖 Theory Question: What could happen if you compute a homography using all matched points without handling outliers? Give an example.
When estimating a homography, we assume that all point correspondences between two images are correct.
However, in real-world conditions, feature detectors (like SIFT or ORB) often produce false matches — known as outliers.
If these outliers are not handled (e.g., by using RANSAC), they can significantly distort the estimated homography matrix.
Mathematical Explanation¶
A homography maps points between two planes as:
$$ \begin{bmatrix} x' \\ y' \\ 1 \end{bmatrix} = H \begin{bmatrix} x \\ y \\ 1 \end{bmatrix} $$
If one or more correspondences $(x, y) \leftrightarrow (x', y')$ are incorrect,
the least-squares solution for $H$ will try to satisfy all points simultaneously —
including those that violate the true geometric relationship.
This leads to large reprojection errors and an inaccurate $H$.
Consequences¶
- Image misalignment: The warped image may appear twisted, scaled, or displaced incorrectly.
- Ghosting or tearing: When stitching, overlapping regions may not align, creating visible seams.
- Invalid perspective: Straight lines may appear bent or broken due to incorrect projective mapping.
Example¶
Suppose we have 100 matched keypoints between two images, but 15 of them are incorrect due to repetitive textures (e.g., windows on a building facade).
If you compute the homography using all 100 matches, the 15 outliers can cause the entire transformation to drift — making even correctly matched areas fail to align.
Using RANSAC, however, these 15 points would be discarded, and the homography would be estimated only from the 85 inliers, producing a stable and accurate transformation.
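To see this effect numerically, the following small simulation (synthetic points, not the assignment data; it reuses the compute_homography_dlt sketch from the Task 2 theory) corrupts 15 of 100 correspondences and compares a fit on all matches against a fit on the 85 clean ones:

# Hedged synthetic demo of outlier contamination in homography estimation
rng = np.random.default_rng(0)
H_true = np.array([[1.0, 0.02, 30.0],
                   [-0.01, 1.0, 10.0],
                   [1e-5, 2e-5, 1.0]])
src = rng.uniform(0, 500, (100, 2))
src_h = np.hstack([src, np.ones((100, 1))])
dst = (H_true @ src_h.T).T
dst = dst[:, :2] / dst[:, 2:3]
dst[:15] += rng.uniform(-200, 200, (15, 2))  # 15 gross outliers from false matches

H_all = compute_homography_dlt(src, dst)               # contaminated by the outliers
H_clean = compute_homography_dlt(src[15:], dst[15:])   # what RANSAC would effectively keep

def mean_error(H):
    proj = (H @ src_h[15:].T).T
    proj = proj[:, :2] / proj[:, 2:3]
    return np.linalg.norm(proj - dst[15:], axis=1).mean()  # error on the clean matches only

print("all matches:", mean_error(H_all), " inliers only:", mean_error(H_clean))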
Task 3: Stitch the Images to Form the Original Image (2 Marks)¶
- Complete the function stitch_with_known_homographies(base_img, other_imgs, homographies) to stitch all regions into the original reference plane.
- Use your implementation of warpPerspective_from_scratch() to warp each region into the base image plane.
- Ensure the base image (ref_plane_img.png) remains unaltered and all warped regions are aligned correctly using the homographies you have calculated in the previous step.
- Return the final stitched image with the same dimensions as the base image.
def stitch_with_known_homographies(base_img, other_imgs, homographies):
    """
    Stitch multiple image regions into the plane of a base image using known homographies.
    Parameters:
        base_img : np.array
            Reference image (Region 1) that serves as the base plane.
        other_imgs : list of np.array
            Restored regions (e.g., Regions 2, 3, 4) to be stitched.
        homographies : list of np.array
            Homography matrices mapping each region to the base image plane.
    Returns:
        stitched_image : np.array
            The final stitched image containing all regions aligned to the base plane.
    """
    ## TODO: Determine the canvas size for stitching
    ## TODO: Place the base image in the canvas
    ## TODO: Translate homographies to canvas coordinates if needed
    ## TODO: Warp each region using your warpPerspective implementation
    ## TODO: Merge warped regions onto the canvas (e.g., simple overwrite or blending)

    h_base, w_base = base_img.shape[:2]

    # 1. Compute the canvas bounding box, starting with the base image corners
    corners = np.array([
        [0, 0, 1],
        [w_base, 0, 1],
        [0, h_base, 1],
        [w_base, h_base, 1]
    ]).T  # shape (3, 4)

    all_x, all_y = [], []

    # Add base image corners
    base_corners = corners[:2, :]  # x and y
    all_x.extend(base_corners[0])
    all_y.extend(base_corners[1])

    # Add corners of the other images transformed by their homographies
    for img, H in zip(other_imgs, homographies):
        if H is None:
            continue
        h, w = img.shape[:2]
        img_corners = np.array([
            [0, 0, 1],
            [w, 0, 1],
            [0, h, 1],
            [w, h, 1]
        ]).T  # shape (3, 4)
        warped_corners = H @ img_corners
        warped_corners /= warped_corners[2, :]
        all_x.extend(warped_corners[0])
        all_y.extend(warped_corners[1])

    # Determine canvas size
    x_min, x_max = int(np.floor(min(all_x))), int(np.ceil(max(all_x)))
    y_min, y_max = int(np.floor(min(all_y))), int(np.ceil(max(all_y)))
    canvas_w = x_max - x_min
    canvas_h = y_max - y_min

    # 2. Initialize canvas
    stitched_image = np.zeros((canvas_h, canvas_w, base_img.shape[2]), dtype=base_img.dtype)

    # Translation that shifts base-plane coordinates into canvas coordinates
    T = np.array([[1, 0, -x_min],
                  [0, 1, -y_min],
                  [0, 0, 1]], dtype=np.float64)

    # 3. Place the base image unaltered into the canvas
    stitched_image[-y_min:-y_min + h_base, -x_min:-x_min + w_base] = base_img

    # 4. Warp and stitch the other images
    for img, H in zip(other_imgs, homographies):
        if H is None:
            continue
        # Compose the translation with H so the warp lands in canvas coordinates
        H_canvas = T @ H
        warped_img = warpPerspective_from_scratch(img, H_canvas, (canvas_h, canvas_w))
        # Copy only the non-empty pixels of the warped region onto the canvas
        mask = np.any(warped_img > 0, axis=2)
        stitched_image[mask] = warped_img[mask]

    return stitched_image
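The merge above simply overwrites canvas pixels wherever a warped region has content. Where seams are visible, one lightweight alternative (a hedged sketch, not something the task requires) is to average the canvas and the warped region in their overlap:

# Hedged sketch: average canvas and warped content where they overlap,
# copy warped content where the canvas is still empty.
def blend_average(canvas, warped):
    warped_mask = np.any(warped > 0, axis=2)
    canvas_mask = np.any(canvas > 0, axis=2)
    overlap = warped_mask & canvas_mask
    only_new = warped_mask & ~canvas_mask
    out = canvas.copy()
    out[only_new] = warped[only_new]
    out[overlap] = ((canvas[overlap].astype(np.float32) +
                     warped[overlap].astype(np.float32)) / 2).astype(canvas.dtype)
    return out

Note that averaging over the base region would modify base pixels, so for this task it would only make sense for overlaps between the warped regions themselves.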
# ----------------------------
# Run stitching on all datasets
# ----------------------------
stitched_all = []
output_dir = "stitched_results"
os.makedirs(output_dir, exist_ok=True)

for dataset_idx, dataset_images in enumerate(restored_all):
    print(f"\n[INFO] Processing dataset {dataset_idx+1}")

    # First image is the reference (Region 1)
    ref_img = dataset_images[0]
    # Remaining images are the other regions
    other_imgs = dataset_images[1:]
    # Homographies for this dataset
    homographies = homographies_all[dataset_idx]

    # Stitch
    stitched = stitch_with_known_homographies(ref_img, other_imgs, homographies)
    stitched_all.append(stitched)

    # Save (convert RGB back to BGR for OpenCV's imwrite)
    save_path = os.path.join(output_dir, f"stitched_dataset_{dataset_idx+1}.png")
    cv2.imwrite(save_path, cv2.cvtColor(stitched, cv2.COLOR_RGB2BGR))
    print(f"[INFO] Saved stitched result: {save_path}")

    # Show
    plt.figure(figsize=(12, 6))
    plt.imshow(stitched)
    plt.title(f"Stitched Result - Dataset {dataset_idx+1}")
    plt.axis("off")
    plt.show()
[INFO] Processing dataset 1
[INFO] Saved stitched result: stitched_results/stitched_dataset_1.png
[INFO] Processing dataset 2
[INFO] Saved stitched result: stitched_results/stitched_dataset_2.png
[INFO] Processing dataset 3
[INFO] Saved stitched result: stitched_results/stitched_dataset_3.png
[INFO] Processing dataset 4
[INFO] Saved stitched result: stitched_results/stitched_dataset_4.png
[INFO] Processing dataset 5
[INFO] Saved stitched result: stitched_results/stitched_dataset_5.png
📖 Theory Question: Why is it important that the base image remains unaltered during stitching?
During image stitching, it is important that the base image remains unaltered for the following reasons:
- Reference for Alignment: The base image serves as the fixed reference plane onto which other images are warped and aligned. Modifying it would distort the reference, making it impossible to accurately compute homographies for the additional images.
- Prevent Accumulated Errors: If the base image is altered during stitching, small interpolation or warping errors could propagate to subsequent images, resulting in visible misalignments and artifacts in the final panorama.
- Maintain Pixel Integrity: Preserving the base image ensures that its original pixel values are used when blending overlapping regions. This prevents color distortions, ghosting, or loss of detail.
- Consistent Blending: Many stitching algorithms use the base image as the anchor for blending (e.g., feathering or multi-band blending). Altering it could disrupt smooth transitions between images.
Keeping the base image unaltered ensures accurate alignment, preserves image quality, and prevents cumulative stitching errors, which are critical for producing a seamless panorama.