Gate IV - The Flux of Motion: Currents and Bridges
As you emerge from the Hall of Convergence, the ground beneath you trembles. Before you stretches the River of Time, a swirling torrent of frozen moments, captured in ancient video scrolls that flicker with ethereal motion. The Guardian of Flux appears, a spectral figure rippling like water:
"The world does not stand still, apprentice. It flows, it shifts, it deceives. To cross this river, you must trace the unseen currents, the optical flow, that bind past to present. Warp the waves, stabilize the storm, and reveal the hidden paths of movement. Only then shall the final gate open, restoring the full World of Vision."
In this gate, you delve into optical flow: the apparent motion of pixels between frames. This is the essence of dynamic vision: understanding how scenes evolve over time. Succeed here, and you graduate as a full Visioneer, guardian of the reconstructed archive.
Mission Objectives
- Implement Lucas-Kanade Flow: Compute per-pixel (u, v) motion using local neighborhoods (no cv2).
- Optical Flow Warping: Use LK flow to warp one frame onto another, simulating motion compensation (no cv2).
Pre-defined Code
Run these cells to load your enchanted video scrolls (8 short clips from the Archive). They'll take ~5 mins on first load.
# Mounting google drive
from google.colab import drive
drive.mount('/content/drive')
Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).
pip install scipy
Requirement already satisfied: scipy in /usr/local/lib/python3.12/dist-packages (1.16.3) Requirement already satisfied: numpy<2.6,>=1.25.2 in /usr/local/lib/python3.12/dist-packages (from scipy) (2.0.2)
# Importing all the required libraries
import numpy as np
import cv2
import matplotlib.pyplot as plt
from matplotlib import style
from glob import glob
from natsort import natsorted
from tqdm import tqdm
import imageio
from IPython.display import Image
from scipy import ndimage
style.use('ggplot')
# Loading all the images from the drive
videos_images = []
for path in tqdm(natsorted(glob('/content/drive/My Drive/ES666CV/videos/D/*'))):
sub_path = path + '/*'
video_frames = []
for files in natsorted(glob(sub_path)):
video_frames.append(cv2.imread(files, 1))
video_frames = np.array(video_frames)
videos_images.append(video_frames)
print(f"Loaded {len(videos_images)} videos.")
# videos_images = np.array(video_frames) # Only possible because all images are of same size
100%|██████████| 8/8 [00:05<00:00, 1.58it/s]
Loaded 8 videos.
def show_image_grid(images, M, N, title='Title', figsize=8):
# Assuming 'images' is a numpy array of shape (num_images, height, width, channels)
if M==1:
row_size = figsize
col_size = figsize//4
elif N==1:
row_size = figsize//4
col_size = figsize
else:
row_size, col_size = figsize, figsize
fig, axes = plt.subplots(M, N, figsize=(row_size, col_size))
if len(images.shape) < 4:
images = np.expand_dims(images.copy(), axis=0)
fig.suptitle(title)
for i in range(M):
for j in range(N):
if M==1 and N==1:
ax = axes
elif M == 1 or N==1:
ax = axes[max(i, j)]
else:
ax = axes[i, j]
index = i * N + j
if index < images.shape[0]:
ax.imshow(cv2.cvtColor(images[index], cv2.COLOR_BGR2RGB))
ax.axis('off')
plt.tight_layout()
plt.show()
def images_to_gif(frames, video_id):
with imageio.get_writer(f"{video_id}.gif", mode="I", fps=24) as writer:
for idx, frame in enumerate(frames):
frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
writer.append_data(frame)
def show_gif(video_id):
with open(f"/content/{video_id}.gif",'rb') as f:
display(Image(data=f.read(), format='png'))
# Preview the raw scrolls (videos 0-7)
for video_idx, video_frames in enumerate(tqdm(videos_images)):
images_to_gif(video_frames, video_idx)
show_gif(video_idx)
Task 1: Lucas-Kanade - Gripping the River's Currents
The Guardian of Flux gestures to the River of Time, its surface deceptively calm: "See how the waters shift unseen? To grip this flux, apprentice, implement the Lucas-Kanade rite from scratch, peering into neighborhoods with convolve2d kernels. Trace per-pixel (u, v) motion, assuming constancy in the flow. Visualize arrows on the grayscale scrolls of video 0 (frames 0-8), revealing the currents' direction."
Your Quest (3 pts): Craft the Lucas-Kanade optical flow algorithm. Compute gradients (Ix, Iy, It) with convolve2d kernels. Solve the local systems for [u, v] in windows. Draw arrows at points of significant motion on a normalized grayscale base.
Outputs: Arrowed grayscale GIF frames of flow over the video.
The Guardian's Tomes (References as Ancient Scrolls)
- Optical Flow (Shi-Tomasi, Sparse LK/HS, Dense Farneback) - Part I: Rite of tracing.
- Implementing Lucas-Kanade in Python: Neighborhood forge.
- The Math Behind Optical Flow: Constancy's equation.
Forge the flow...
Lucas-Kanade Optical Flow: Theory & Mathematics
The LucasโKanade method assumes that the motion (optical flow) between two consecutive frames is small and constant within a local neighborhood.
1. Brightness Constancy Assumption
$ I(x, y, t) = I(x + u, y + v, t + 1) $ Expanding with a Taylor series and ignoring higher-order terms: $ I_x u + I_y v + I_t = 0 $ where
- $ I_x = \frac{\partial I}{\partial x} $: gradient along x
- $ I_y = \frac{\partial I}{\partial y} $: gradient along y
- $ I_t = \frac{\partial I}{\partial t} $: temporal gradient between frames
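For completeness, the first-order Taylor expansion behind this step is $ I(x + u, y + v, t + 1) \approx I(x, y, t) + I_x u + I_y v + I_t $; substituting it into the constancy assumption and cancelling $ I(x, y, t) $ from both sides leaves the constraint $ I_x u + I_y v + I_t = 0 $.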
2. Local Window Solution
For each pixel, consider a local window $ W $ and solve for $ (u, v) $:
$ \sum_{(x, y) \in W} \begin{bmatrix} I_x^2 & I_x I_y \\ I_x I_y & I_y^2 \end{bmatrix} \begin{bmatrix} u \\ v \end{bmatrix} = - \sum_{(x, y) \in W} \begin{bmatrix} I_x I_t \\ I_y I_t \end{bmatrix} $
3. Least-Squares Solution
$ \begin{bmatrix} u \\ v \end{bmatrix} = (A^T A)^{-1} A^T b $
where $ A = [I_x, I_y] $ stacks the window's gradients row by row and $ b = -I_t $.
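Since $ A^T A $ is a $ 2 \times 2 $ matrix, its inverse can be written out explicitly; this closed form is exactly what the windowed-sum implementation in Task 2 evaluates:
$ \begin{bmatrix} u \\ v \end{bmatrix} = \frac{1}{\sum I_x^2 \sum I_y^2 - \left( \sum I_x I_y \right)^2} \begin{bmatrix} \sum I_y^2 & -\sum I_x I_y \\ -\sum I_x I_y & \sum I_x^2 \end{bmatrix} \begin{bmatrix} -\sum I_x I_t \\ -\sum I_y I_t \end{bmatrix} $
The denominator is $ \det(A^T A) $, which is why the implementations below solve only where this determinant (or the smallest eigenvalue of $ A^T A $) exceeds a small threshold.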
from scipy.signal import convolve2d
import cv2
import numpy as np
def optical_flow(frames, video_id):
# Convert all frames to normalized grayscale
gray_frames = [cv2.cvtColor(f, cv2.COLOR_BGR2GRAY).astype(np.float32) / 255.0 for f in frames]
# Define derivative kernels
kernel_x = np.array([[-1, 1],
[-1, 1]], dtype=np.float32) * 0.25
kernel_y = np.array([[-1, -1],
[1, 1]], dtype=np.float32) * 0.25
kernel_t1 = np.ones((2, 2), dtype=np.float32) * 0.25
kernel_t2 = -kernel_t1
output_frames = []
# Process consecutive frame pairs
for i in range(len(gray_frames) - 1):
I1, I2 = gray_frames[i], gray_frames[i + 1]
# Compute gradients using convolution
Ix = (convolve2d(I1, kernel_x, boundary='symm', mode='same') +
convolve2d(I2, kernel_x, boundary='symm', mode='same'))
Iy = (convolve2d(I1, kernel_y, boundary='symm', mode='same') +
convolve2d(I2, kernel_y, boundary='symm', mode='same'))
It = (convolve2d(I2, kernel_t1, boundary='symm', mode='same') +
convolve2d(I1, kernel_t2, boundary='symm', mode='same'))
# Initialize optical flow fields
u, v = np.zeros_like(I1), np.zeros_like(I1)
window_size = 5
w = window_size // 2
# Estimate flow vectors per local window
for y in range(w, I1.shape[0] - w):
for x in range(w, I1.shape[1] - w):
Ix_local = Ix[y - w:y + w + 1, x - w:x + w + 1].flatten()
Iy_local = Iy[y - w:y + w + 1, x - w:x + w + 1].flatten()
It_local = It[y - w:y + w + 1, x - w:x + w + 1].flatten()
A = np.vstack((Ix_local, Iy_local)).T
b = -It_local
ATA = A.T @ A
ATb = A.T @ b
# Solve only if matrix is well-conditioned
if np.linalg.det(ATA) >= 1e-5:
nu = np.linalg.inv(ATA) @ ATb
u[y, x], v[y, x] = nu[0], nu[1]
# Prepare visualization frame
vis = cv2.normalize(I1, None, 0, 255, cv2.NORM_MINMAX).astype(np.uint8)
vis = cv2.cvtColor(vis, cv2.COLOR_GRAY2BGR)
# Draw motion vectors (red arrows)
step = 8
for y in range(0, vis.shape[0], step):
for x in range(0, vis.shape[1], step):
if np.hypot(u[y, x], v[y, x]) > 0.5:
end_x = int(x + u[y, x] * 5)
end_y = int(y + v[y, x] * 5)
cv2.arrowedLine(vis, (x, y), (end_x, end_y),
(0, 0, 255), 1, tipLength=0.3)
output_frames.append(vis)
# Save visualization as GIF
images_to_gif(output_frames, f"{video_id}_optical")
for video_idx, video_frames in enumerate(tqdm(videos_images)):
optical_flow(video_frames, video_idx)
100%|██████████| 8/8 [17:19<00:00, 129.88s/it]
for video_idx in tqdm(range(len(videos_images))):
show_gif(str(video_idx)+'_optical')
Color and All Frames (Extra)
from scipy import signal
import numpy as np
import cv2
def optical_flow_consecutive(im1, im2, window_size, threshold=1e-2):
"""
Estimate dense optical flow (u, v) between two consecutive images using the Lucas-Kanade method.
Steps:
1. Compute spatial (Ix, Iy) and temporal (It) image gradients using convolution filters.
2. For each pixel, collect gradients from its local neighborhood (window_size × window_size).
3. Solve the least-squares system A·[u, v]^T = -It for the motion vector [u, v].
4. Ensure numerical stability using Shi-Tomasi's criterion (smallest eigenvalue > threshold).
Args:
im1 (np.ndarray): Frame at time t.
im2 (np.ndarray): Frame at time t+1.
window_size (int): Size of the local neighborhood window.
threshold (float): Eigenvalue threshold for well-conditioned regions.
Returns:
    tuple: (u, v, Ix, Iy, It) flow fields and spatial/temporal image gradients.
"""
# Convert both frames to grayscale and normalize to [0,1]
im1 = cv2.cvtColor(im1, cv2.COLOR_BGR2GRAY) / 255.0
im2 = cv2.cvtColor(im2, cv2.COLOR_BGR2GRAY) / 255.0
half_w = window_size // 2
# Gradient kernels
kernel_x = np.array([[-1., 1.], [-1., 1.]])
kernel_y = np.array([[-1., -1.], [1., 1.]])
kernel_t = np.array([[1., 1.], [1., 1.]])
# Compute derivatives
Ix = signal.convolve2d(im1, kernel_x, boundary='symm', mode='same')
Iy = signal.convolve2d(im1, kernel_y, boundary='symm', mode='same')
It = signal.convolve2d(im2, kernel_t, boundary='symm', mode='same') \
+ signal.convolve2d(im1, -kernel_t, boundary='symm', mode='same')
# Initialize optical flow fields
u = np.zeros_like(im1)
v = np.zeros_like(im1)
# Lucas-Kanade per-pixel estimation
for i in range(half_w, im1.shape[0] - half_w):
for j in range(half_w, im1.shape[1] - half_w):
# Extract local window patches
Ix_patch = Ix[i-half_w:i+half_w+1, j-half_w:j+half_w+1].flatten()
Iy_patch = Iy[i-half_w:i+half_w+1, j-half_w:j+half_w+1].flatten()
It_patch = It[i-half_w:i+half_w+1, j-half_w:j+half_w+1].flatten()
# Construct the least-squares system A·[u, v]^T = b, with b = -It
# (sign matches the brightness-constancy constraint above)
A = np.vstack((Ix_patch, Iy_patch)).T
b = -It_patch.reshape(-1, 1)
# Check conditioning using minimum eigenvalue
if np.min(np.linalg.eigvals(A.T @ A)) < threshold:
continue
# Solve for [u, v]
flow = np.linalg.pinv(A) @ b
u[i, j] = flow[0, 0]
v[i, j] = flow[1, 0]
return u, v, Ix, Iy, It
def draw_on_frame(frame, U, V, color=(0, 255, 0), scale=5, step_size=10, magnitude_threshold=1.0):
"""
Draw flow vectors as arrows on an image using OpenCV.
Arrows are drawn only for significant motion magnitudes.
"""
line_color = color
max_magnitude = np.sqrt(np.max(U**2 + V**2))
for i in range(0, frame.shape[0], step_size):
for j in range(0, frame.shape[1], step_size):
u, v = U[i, j], V[i, j]
magnitude = np.sqrt(u**2 + v**2)
# Draw only motions above a fraction of the max magnitude
if magnitude > magnitude_threshold * max_magnitude:
# Normalize and scale the arrow length
u_scaled = (u / max_magnitude) * scale
v_scaled = (v / max_magnitude) * scale
cv2.arrowedLine(
frame,
(j, i),
(int(round(j + u_scaled)), int(round(i + v_scaled))),
line_color,
1,
tipLength=0.3
)
return frame
def overlay_flow_on_frame(frame, u, v, color, step=10, scale=1):
"""
Overlay optical flow vectors on a frame using matplotlib's quiver plot.
Returns a new frame with quiver arrows drawn on it.
"""
# Prepare coordinate grids
y, x = np.mgrid[0:u.shape[0], 0:u.shape[1]]
# Downsample vectors for clarity
x_ds = x[::step, ::step]
y_ds = y[::step, ::step]
u_ds = u[::step, ::step]
v_ds = v[::step, ::step]
# Convert to RGB for visualization
frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
plt.figure(figsize=(10, 10))
plt.imshow(frame_rgb)
plt.quiver(
x_ds, y_ds, u_ds, v_ds,
color=color, angles='xy',
scale_units='xy', scale=scale
)
plt.axis('off')
plt.savefig("temp_overlay.png", bbox_inches='tight', pad_inches=0)
plt.close()
overlay_frame = cv2.imread("temp_overlay.png")
return overlay_frame
def optical_flow(frames, video_id, scale=1):
"""
Compute optical flow between consecutive frames and visualize as arrowed overlays.
Creates and saves a GIF of all overlay frames.
"""
optical_flow_frames = []
for i in range(len(frames) - 1):
im1, im2 = frames[i], frames[i + 1]
u, v, _, _, _ = optical_flow_consecutive(im1, im2, 15)
# Adjust visualization settings per video ID
if video_id < 6 and video_id != 1:
overlay = overlay_flow_on_frame(im1, u, v, "red", 5, 0.5)
elif video_id == 1:
overlay = overlay_flow_on_frame(im1, u, v, "red", 5, 0.2)
elif video_id in [6, 7]:
overlay = overlay_flow_on_frame(im1, u, v, "blue", 8, 0.5)
elif video_id == 8:
overlay = overlay_flow_on_frame(im1, u, v, "yellow", 5, 0.3)
elif video_id == 9:
overlay = overlay_flow_on_frame(im1, u, v, "blue", 10, 0.9)
elif video_id == 10:
overlay = overlay_flow_on_frame(im1, u, v, "red", 10, 0.8)
else:
overlay = overlay_flow_on_frame(im1, u, v, "red", 5, 0.5)
optical_flow_frames.append(overlay)
images_to_gif(optical_flow_frames, f"{video_id}_optical")
for video_idx, video_frames in enumerate(tqdm(videos_images)):
optical_flow(video_frames, video_idx)
100%|██████████| 8/8 [1:06:56<00:00, 502.09s/it]
for video_idx in tqdm(range(len(videos_images))):
show_gif(str(video_idx)+'_optical')
Quest Time (1pt): The Guardian pauses, the river's murmur soft: "You've felt the flow's first tug, apprentice. Sit by the water and answer these simple thoughts; let them sharpen your eyes."
What story do the arrows tell? Do they all point one way, like a steady stream, or twist like wind? What might that mean for the scene?
If the arrows are few or short, what does that represent?
What story do the arrows tell?
The arrows show how things in the video are moving.
- If they all point in one direction, it means everything is moving the same way, like the camera panning or the whole scene shifting together.
- If they twist or go in different directions, it means different parts are moving differently, like people, animals, or objects moving on their own.
If the arrows are few or short, what does that represent?
If the arrows are few or short, it means there is little or no movement.
The scene is mostly still or has very small motion, suggesting a calm or static moment in the video.
Task 2: Optical Flow Warping - Bridging the River's Waves
With the currents traced, the Guardian points to the chasm between frames: "The flow is known, but the river deceives: past and present drift apart. Bridge them with optical warping, apprentice: remap the 1st frame's pixels along the unseen paths of your Lucas-Kanade rite, forging a vision that aligns with the 9th frame. From scratch, weave the warp, then compare the bridged image to the distant shore."
Your Quest (4 pts): Select the 1st and 9th frames from the videos. Use the computed flow from Task 1. Implement warping from scratch: for each pixel in the 9th frame, trace back via the flow to sample from the 1st frame.
Outputs: Warped image; compare PSNR values of the warped result vs the 9th frame of each video.
Guardian Tomes
- Motion and Optical Flow: Currents' path.
- Image Warping: Forging bridges.
- Forward and Backward Warping for Optical Flow-Based Frame Interpolation: Weaving rite.
Bridge the flux...
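Before forging the bridge, two formulas worth keeping at hand. Backward warping reconstructs each target pixel by sampling the source frame at its flow-displaced location, and PSNR (with intensities normalized to $ [0, 1] $, so the peak value is 1) scores how closely the warped frame matches the true 9th frame:
$ \hat{I}_2(x, y) = I_1\big(x - u(x, y),\, y - v(x, y)\big) \qquad \text{PSNR} = 10 \log_{10} \frac{1}{\text{MSE}(\hat{I}_2, I_2)} $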
from scipy.signal import convolve2d
from scipy import ndimage
from scipy.ndimage import map_coordinates
from skimage.metrics import peak_signal_noise_ratio as psnr
import numpy as np
import cv2
def optical_flow_warping(frame_a, frame_b):
"""
Warp frame_a toward frame_b using optical flow computed via the Lucas-Kanade method.
Returns the warped image and prints the PSNR between the warped result and frame_b.
"""
# --- Convert frames to normalized grayscale ---
I1 = cv2.cvtColor(frame_a, cv2.COLOR_BGR2GRAY).astype(np.float32) / 255.0
I2 = cv2.cvtColor(frame_b, cv2.COLOR_BGR2GRAY).astype(np.float32) / 255.0
# --- Spatial and temporal derivative kernels ---
kernel_x = np.array([[-1, 1], [-1, 1]]) * 0.25
kernel_y = np.array([[-1, -1], [1, 1]]) * 0.25
kernel_t1 = np.ones((2, 2)) * 0.25
kernel_t2 = -kernel_t1
# --- Compute derivatives ---
Ix = convolve2d(I1, kernel_x, boundary='symm', mode='same') + convolve2d(I2, kernel_x, boundary='symm', mode='same')
Iy = convolve2d(I1, kernel_y, boundary='symm', mode='same') + convolve2d(I2, kernel_y, boundary='symm', mode='same')
It = convolve2d(I2, kernel_t1, boundary='symm', mode='same') + convolve2d(I1, kernel_t2, boundary='symm', mode='same')
# --- Lucas-Kanade flow estimation (windowed least squares) ---
window = 5
W = np.ones((window, window))
Ix2 = ndimage.convolve(Ix * Ix, W, mode='reflect')
Iy2 = ndimage.convolve(Iy * Iy, W, mode='reflect')
Ixy = ndimage.convolve(Ix * Iy, W, mode='reflect')
Ixt = ndimage.convolve(Ix * It, W, mode='reflect')
Iyt = ndimage.convolve(Iy * It, W, mode='reflect')
det = Ix2 * Iy2 - Ixy**2
det[det == 0] = 1e-10 # avoid divide-by-zero
u = (-Iy2 * Ixt + Ixy * Iyt) / det
v = (Ixy * Ixt - Ix2 * Iyt) / det
# --- Backward warping: each target pixel samples I1 at its flow-displaced source ---
h, w = I1.shape
X, Y = np.meshgrid(np.arange(w), np.arange(h))
Xb = np.clip(X - u, 0, w - 1)
Yb = np.clip(Y - v, 0, h - 1)
warped_gray = map_coordinates(I1, [Yb, Xb], order=1, mode='reflect')
warped_image = cv2.cvtColor((warped_gray * 255).astype(np.uint8), cv2.COLOR_GRAY2BGR)
# --- Compare similarity (images are normalized to [0, 1], so data_range=1) ---
psnr_value = psnr(I2, warped_gray, data_range=1.0)
print(f"PSNR: {psnr_value:.2f} dB")
return warped_image
for video_idx, video_frames in enumerate(tqdm(videos_images)):
i = 1
warped_image = optical_flow_warping(video_frames[i], video_frames[i+8])
show_image_grid(np.array([video_frames[i+8], warped_image]), 1, 2, 'Warp Image Comparison', figsize=16)
0%|          | 0/8 [00:00<?, ?it/s]
PSNR: 25.45 dB
12%|█▎        | 1/8 [00:00<00:02, 3.00it/s]
PSNR: 27.66 dB
25%|██▌       | 2/8 [00:00<00:02, 2.81it/s]
PSNR: 23.10 dB
38%|███▊      | 3/8 [00:01<00:01, 2.79it/s]
PSNR: 22.92 dB
50%|█████     | 4/8 [00:01<00:01, 2.99it/s]
PSNR: 16.60 dB
62%|██████▎   | 5/8 [00:01<00:01, 2.94it/s]
PSNR: 16.74 dB
75%|███████▌  | 6/8 [00:02<00:00, 3.05it/s]
PSNR: 16.86 dB
88%|████████▊ | 7/8 [00:02<00:00, 3.19it/s]
PSNR: 21.73 dB
100%|██████████| 8/8 [00:02<00:00, 3.02it/s]
Color (Extra)
def inverse_warp_image_from_scratch(frame, u, v, current_time, other_time, target_time):
"""
Warp an image using inverse optical flow fields without external interpolation libraries.
Args:
frame (np.ndarray): Grayscale image to warp.
u (np.ndarray): Horizontal optical flow field.
v (np.ndarray): Vertical optical flow field.
current_time (float): The time of the current frame.
other_time (float): The time of the other frame (frame we are warping towards).
target_time (float): The time of the target frame (interpolated frame).
Returns:
np.ndarray: Warped image.
"""
h, w = frame.shape[:2]
warped_image = np.zeros_like(frame, dtype=np.float32)
time_scale = (target_time - current_time) / (other_time - current_time)
# Iterate over all pixels in the target (warped) image
for y in range(h):
for x in range(w):
# Compute the source (original) pixel location using inverse flow
x_orig = x - u[y, x] * time_scale
y_orig = y - v[y, x] * time_scale
# Ensure that the original pixel location is within bounds
if x_orig < 0 or x_orig >= w - 1 or y_orig < 0 or y_orig >= h - 1:
continue
x0, y0 = int(np.floor(x_orig)), int(np.floor(y_orig))
x1, y1 = min(x0 + 1, w - 1), min(y0 + 1, h - 1)
dx, dy = x_orig - x0, y_orig - y0
# Bilinear interpolation over the four neighboring pixels
warped_image[y, x] = ((1 - dx) * (1 - dy) * frame[y0, x0]
                      + dx * (1 - dy) * frame[y0, x1]
                      + (1 - dx) * dy * frame[y1, x0]
                      + dx * dy * frame[y1, x1])
return np.clip(warped_image, 0, 255)
def optical_flow_warping(frame_a, frame_b, start_time, end_time, target_time):
"""
Perform optical flow-based warping to interpolate a frame at target_time.
Args:
frame_a (np.ndarray): First frame.
frame_b (np.ndarray): Second frame.
start_time (float): Time of frame_a.
end_time (float): Time of frame_b.
target_time (float): Target time for the interpolated frame.
Returns:
np.ndarray: Warped interpolated frame.
"""
# Compute optical flow from frame_a to frame_b (forward)
U_front, V_front, _, _, _ = optical_flow_consecutive(frame_a, frame_b, 15)
warped_frame_forward = inverse_warp_image_from_scratch(frame_a, U_front, V_front, start_time, end_time, target_time).astype(np.uint8)
# Compute optical flow from frame_b to frame_a (backward)
# (U_back already points from frame_b toward frame_a, so no extra negation is needed)
U_back, V_back, _, _, _ = optical_flow_consecutive(frame_b, frame_a, 15)
warped_frame_backward = inverse_warp_image_from_scratch(frame_b, U_back, V_back, end_time, start_time, target_time).astype(np.uint8)
return warped_frame_forward, warped_frame_backward
for video_idx, video_frames in enumerate(tqdm(videos_images)):
i = 1
warped_image, _ = optical_flow_warping(video_frames[i], video_frames[i+8], start_time=i, end_time=i+8, target_time=i+8)
show_image_grid(np.array([video_frames[i+8], warped_image]), 1, 2, 'Warp Image Comparison', figsize=16)
Quest Time (1pt): The Guardian's voice echoes softly: "You've woven the bridge, apprentice: past pulled to present. Pause and ponder on a basic truth."
What is "backward warping," and why pull from source to target instead of pushing forward?
Backward warping means that for every pixel in the target image, we trace backward through the optical flow field to find where that pixel came from in the source image, and then sample its value from there.
We "pull" pixels from the source (using coordinates from the target) instead of "pushing" them forward because:
- In forward warping, multiple source pixels might land on the same target pixel, or leave gaps (holes) where no source pixel maps.
- In backward warping, every target pixel gets a value by sampling from a valid source location, giving a complete, hole-free warped image.
In short:
Backward warping = "pulling" colors from the source into each target pixel.
It avoids the holes and overlaps that occur when trying to "push" pixels forward.
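A minimal 1-D sketch of the difference (the array values and the constant flow here are made up purely for illustration): forward warping pushes source pixels toward their destinations and can leave holes, while backward warping pulls a value for every target pixel.
import numpy as np
# A toy 1-D "image" and a constant integer flow that shifts content right by 2
src = np.array([10., 20., 30., 40., 50.])
flow = np.full(5, 2)
# Forward warping: push each source pixel to x + flow[x]
fwd = np.full(5, np.nan)  # NaN marks holes left by the push
for x in range(5):
    tx = x + flow[x]
    if 0 <= tx < 5:
        fwd[tx] = src[x]  # colliding pixels would overwrite silently
# Backward warping: for each target pixel, pull from x - flow[x]
bwd = np.empty(5)
for x in range(5):
    sx = int(np.clip(x - flow[x], 0, 4))
    bwd[x] = src[sx]  # every target pixel receives a value
print(fwd)  # [nan nan 10. 20. 30.] -> holes at positions 0 and 1
print(bwd)  # [10. 10. 10. 20. 30.] -> complete; edge values repeat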
The Final Curiosity Rite - Decoding the Hidden Gate
As the River of Time settles into calm reflection, the Guardian of Flux reveals one last mystery.
From the depths of the Archive, an image materializes: a sealed Gate unlike any before. Its surface hums faintly, patterns shifting between shadows and light.
"The journey ends where perception begins," whispers the Guardian.
"Hidden within these pixels lies the last message of the Order. To read it, you must see beyond brightness and color, into the very bits of vision itself."
Your task (1pt): Decode the concealed message embedded within this Gate's bit-planes. Extract the hidden text from the image's lower bits using bitwise shift operators. The lower bits of the image will reveal the final teaching of the Visioneers, a message only visible to those who have mastered perception itself.
Jot the decoded text below; the door creaks wider with your sight. Well earned, Visioneer; the veil thins...
encrypted_gate = cv2.imread('/content/drive/MyDrive/ES666CV/videos/Decode_Message/encoded.png')
encrypted_gate = cv2.cvtColor(encrypted_gate, cv2.COLOR_BGR2RGB)
# Display
plt.figure(figsize=(8, 6))
plt.imshow(encrypted_gate)
plt.axis('off')
plt.show()
import cv2
import numpy as np
import matplotlib.pyplot as plt
# Load and convert to RGB
encrypted_gate = cv2.imread('/content/drive/MyDrive/ES666CV/videos/Decode_Message/encoded.png')
encrypted_gate = cv2.cvtColor(encrypted_gate, cv2.COLOR_BGR2RGB)
# Step 1: Extract only the least significant bit (LSB) of each channel
lsb = encrypted_gate & 1 # keeps only last bit of each channel (R,G,B)
# Step 2: Combine bits to visualize hidden structure
# You can scale it up so it's visible as 0 or 255
hidden_image = (lsb * 255).astype(np.uint8)
plt.figure(figsize=(8,6))
plt.imshow(hidden_image)
plt.axis('off')
plt.show()
# Step 3: If the hidden text is encoded in grayscale:
gray_hidden = cv2.cvtColor(hidden_image, cv2.COLOR_RGB2GRAY)
plt.figure(figsize=(8,6))
plt.imshow(gray_hidden, cmap='gray')
plt.axis('off')
plt.show()
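If the message is stored as ASCII text, one bit per image byte (a common LSB-steganography layout; the exact channel and scan order used by the Archive's image are assumptions here), the bitwise shift operators the task mentions can regroup the LSBs into characters. A minimal sketch under those assumptions:
# Hypothetical decoder: assumes the text's bits sit in the LSB of each byte
# of the flattened RGB image, row-major, 8 bits per character, MSB first.
bits = (encrypted_gate.flatten() & 1)[:8 * 2000]  # cap at 2000 characters for speed
chars = []
for i in range(0, len(bits) - 7, 8):
    byte = 0
    for b in bits[i:i + 8]:
        byte = (byte << 1) | int(b)  # shift each bit into the current byte
    if byte == 0:  # stop at a NUL terminator, if present
        break
    chars.append(chr(byte))
print(''.join(chars))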
Epilogue - The World Reconstructed
The final Gate fades open as the encoded message glows faintly on your screen.
Bit by bit, light turns into language, and you receive the last teaching of the Order.
The River of Time falls silent. The Guardians withdraw into the mist.
You stand alone in the Grand Archive โ now alive once more, its images breathing,
its motion restored, its fragments whole.
You have crossed the Four Gates of Vision.
Each gate was more than an assignment; it was a rite of perception.
Through them, you have learned not merely to look, but to see:
to discover order in data, motion in stillness, and meaning in patterns.
"The Archive is whole again," murmurs the Grand Archivist.
"You have not just processed images; you have perceived the world itself."
The scrolls close. The Hall of Vision fades into light.
All that remains is reflection, motion, and truth, beyond pixels.
Thus ends the Chronicle of the Visioneers... Congratulations!