Lecture 12¶

Announcements¶

  • New pairs:

    • Layla and Grayson
    • Finn and Charlie
    • Camiel and Ned
    • Shingo and Jacob
  • Project 2 due tonight! How's it going?

  • Project 3 out tomorrow; we'll cover plane sweep stereo in tomorrow's class

  • You can still respond to my Week 2 feedback email if you haven't already!

  • I think I fixed the github classroom uv issue for projects 2 and 3

    • If you created your repo before the fix, your repo may not have it. You can edit .github/workflows/classroom.yml to add these lines before the - name: Checkout code line:
      - name: Install the latest version of uv
        uses: astral-sh/setup-uv@v7
      
  • Week 2 Checkins today

  • Today's tea: Nepal Imperial Black or Four Seasons Oolong?

Goals¶

  • Be able to implement a basic rectified stereo depth estimation routine.
  • Understand why matching is the hard part of stereo vision.
  • Know the definition and formation of the stereo cost volume.
  • Know why and how to use the normalized cross-correlation cost function for stereo matching.
  • Understand the construction of the intrinsic and extrinsic camera matrices.
In [31]:
# boilerplate setup
%load_ext autoreload
%autoreload 2

%matplotlib inline

import os
import sys

src_path = os.path.abspath("../src")
if src_path not in sys.path:
    sys.path.insert(0, src_path)

# Library imports
import numpy as np
import imageio.v3 as imageio
import matplotlib.pyplot as plt
import skimage as skim
import cv2

# codebase imports
import util
import filtering
import features
import geometry
The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload

Outline¶

  • Rectified stereo:

    • depth from disparity reduces stereo vision to the correspondence problem

    • assumed a simple case: the rectified case, where the two cameras differ only by a horizontal translation (the baseline), the image planes are coplanar, and corresponding points therefore lie on the same scanline (row)

    • correspondence - sounds familiar, but now it's dense. some metrics:

      • SSD - sum of squared differences
      • SAD - sum of absolute differences
      • CC - cross-correlation: filter the right scanline with the left patch; where product is highest, call it a match; in practice, use NCC instead:
      • NCC - normalized cross-correlation: standardize (subtract mean, divide by std) patches before multiplication to add invariance to photometric changes
    • The cost volume: given a matching cost c:

      for i in rows:
        for j in columns:
          for d in disparities:
            C[i, j, d] = c(img1[i,j], img2[i,j+d])
      

      (note that c will usually look at a patch around img[i,j]; a runnable numpy sketch of this loop follows below)

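Before jumping into real images, here is a minimal numpy sketch of what that cost-volume pseudocode computes. It uses a toy per-pixel absolute-difference cost (no patches) and only non-negative disparities; the names (toy_left, toy_right, n_disp) are made up for illustration. Note that the in-class loop later in this notebook never stores the full volume; it just takes the argmin over d at each pixel.

    # toy cost volume: C[i, j, d] compares toy_left[i, j] with toy_right[i, j + d]
    toy_left = np.random.rand(20, 30)
    toy_right = np.random.rand(20, 30)
    n_disp = 8

    Ht, Wt = toy_left.shape
    C = np.full((Ht, Wt, n_disp), np.inf)   # inf marks disparities that run off the image
    for d in range(n_disp):
        C[:, :Wt - d, d] = np.abs(toy_left[:, :Wt - d] - toy_right[:, d:])

    toy_disparity = C.argmin(axis=2)        # winner-take-all over the disparity axis
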
In [32]:
left = util.imread_grayfloat("../data/flowers_left.png")
right = util.imread_grayfloat("../data/flowers_right.png")
In [33]:
util.imshow_gray(np.vstack((left, right)))
[Figure: the left and right flower images stacked vertically]
In [34]:
# patch = left[115:125, 205:215]
# patch = left[55:61, 102:107]
patch = left[0:35, 45:80]

util.imshow_gray(patch)
[Figure: the patch extracted from the left image]
In [35]:
def fast_filter(img, filter):
    return cv2.filter2D(img, -1, filter)
In [36]:
# zero-mean the patch so it can be used as a cross-correlation template
kernel = patch - patch.mean()
xcorr_out = fast_filter(right - right.mean(), kernel)
plt.imshow(np.vstack([right, xcorr_out/xcorr_out.max()]))
Out[36]:
<matplotlib.image.AxesImage at 0x126e433e0>
[Figure: the right image stacked above its cross-correlation response to the patch]
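
Note that the filter above computes only zero-mean cross-correlation: the patch and the image each have a mean subtracted, but nothing is divided by a standard deviation, so the response still depends on local contrast. For comparison, OpenCV's matchTemplate with the TM_CCOEFF_NORMED method computes the fully normalized score in [-1, 1]; a minimal sketch (casting to float32, which matchTemplate expects):

    ncc_map = cv2.matchTemplate(right.astype(np.float32), patch.astype(np.float32), cv2.TM_CCOEFF_NORMED)
    plt.imshow(ncc_map)   # peaks near +1 mark strong normalized matches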

Define some cost functions:

In [40]:
import tqdm

def ncc_cost(left_patch, right_patch):
    # normalized cross-correlation: standardize each patch (subtract mean, divide by std),
    # then sum the elementwise product. Higher is better; equals the patch size for a perfect match.
    lp = left_patch - left_patch.mean()
    rp = right_patch - right_patch.mean()
    lp /= lp.std()
    rp /= rp.std()
    return (lp * rp).sum()

def ssd_cost(left_patch, right_patch):
    return np.sum((left_patch - right_patch)**2)

def sad_cost(left_patch, right_patch):
    return np.sum(np.abs(left_patch - right_patch))

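A quick sanity check of the photometric-invariance claim from the outline (a small sketch; the patch location is arbitrary and assumed not to be constant):

    p = left[50:60, 50:60]        # an arbitrary 10x10 patch from the left image
    q = 1.5 * p + 0.1             # the same patch with a contrast/brightness change

    print("NCC:", ncc_cost(p, q))   # unchanged by the affine intensity change (= 100, the patch size, i.e. a perfect match)
    print("SSD:", ssd_cost(p, q))   # grows with the photometric change
    print("SAD:", sad_cost(p, q))
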
Compute the cost volume:

In [48]:
H, W = left.shape
window = 5
hw = window // 2

COST = "NCC"

disparity_img = np.zeros_like(left)

disparity_limit = 60

for i in tqdm.tqdm(range(hw, H-hw)): # for each row
    low_i = i-hw
    high_i = i+hw+1
    for j in range(hw, W-hw): # for each column within a local window
        low_j = j-hw
        high_j = j+hw+1
        
        # extract the left patch:
        left_patch = left[low_i:high_i, low_j:high_j] 
        
        costs = 1e5 * np.ones((disparity_limit*2+1)) # initialize costs to a large value so out-of-bounds disparities never win the argmin
        for d in range(-disparity_limit, disparity_limit+1): # for each possible disparity
            if 0 <= low_j+d and high_j+d <= W:
                
                # extract a right patch at the current disparity
                right_patch = right[low_i:high_i, low_j+d:high_j+d]

                # compute the cost                
                if COST == "NCC":
                    c = -ncc_cost(left_patch, right_patch) # NCC is a similarity (higher = better), so negate it to use as a cost
                elif COST == "SSD":
                    c = ssd_cost(left_patch, right_patch)
                elif COST == "SAD":
                    c = sad_cost(left_patch, right_patch)

                costs[d + disparity_limit] = c
        
        # set the disparity to the one with lowest cost
        disparity_img[i,j] = np.argmin(costs) - disparity_limit

plt.imshow(np.vstack([left, disparity_img/disparity_img.max()]))
plt.colorbar()
100%|█████████████████████████████████████████████████████████████| 120/120 [00:54<00:00,  2.20it/s]
Out[48]:
<matplotlib.colorbar.Colorbar at 0x127461160>
[Figure: the left image stacked above the normalized disparity map, with colorbar]
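
To close the loop on "depth from disparity": for a rectified pair, depth follows from disparity as $Z = \frac{fB}{d}$, where $f$ is the focal length in pixels and $B$ is the baseline. The flowers pair's actual $f$ and $B$ aren't given here, so the numbers below are made-up placeholders just to show the conversion:

    f_px = 500.0     # hypothetical focal length in pixels
    baseline = 0.1   # hypothetical baseline in meters

    d = np.abs(disparity_img)
    depth = np.where(d > 0, f_px * baseline / np.maximum(d, 1e-6), 0.0)   # meters; 0 where no disparity was found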
In [49]:
np.set_printoptions(suppress=True) # suppress scientific notation
In [50]:
points = np.array([
    [0, 0, -200],
    [-20, 50, -200],
    [-100, 100, -200]
], dtype=np.float64).T
HW #2¶

Suppose a camera is in canonical pose - that is, COP is at world origin, the optical axis runs along the negative z axis, and the projection plane is oriented with $x$ going right and $y$ going up in image space. The focal length of the camera is 100 (this is measured in pixels), and the height and width of the image are also 100. Find the image coordinates (i.e., pixel coordinates that correspond to indices into a numpy array) of the following three 3D points:

  • Point 1: $[0, 0, -200]$
  • Point 2: $[-20, 50, -200]$
  • Point 3: $[-100, 100, -200]$

Keep in mind that in numpy arrays, the origin is at the top left and $y$ goes down.
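
As a reminder of the projection conventions (an illustration with a made-up point, not one of the HW points): assuming the principal point is at the image center, a point at camera coordinates $(X, Y, Z)$ with $Z < 0$ lands at $x' = f\frac{X}{-Z}$, $y' = f\frac{Y}{-Z}$ on the image plane, and then $u = c_x + x'$, $v = c_y - y'$ in pixel coordinates (the $y$ flip accounts for the array origin being at the top left). For example, with $f = 100$ and a $100 \times 100$ image ($c_x = c_y = 50$), a hypothetical point $[10, -20, -50]$ gives $x' = 20$, $y' = -40$, so $(u, v) = (70, 90)$.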

HW #3¶

Write down the intrinsics matrix $K$ that maps any point from camera coordinates to image coordinates as above. To check your work, make sure that applying the matrix to the three points from the previous problem yields the expected result.

In [ ]:
# HW 3: fill in your intrinsics matrix here:
K = np.array([
    [1, 0, 0],
    [0, 1, 0],
    [0, 0, 1]
], dtype=np.float64)

# HW 3: verify that K @ points yields the expected pixel coordinates
# apply K to points to get points_img
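
One generic reminder for that check (not specific to this camera): applying a 3x3 matrix to homogeneous points leaves a scale factor in the last row, so divide by it to recover pixel coordinates. A small sketch with a made-up helper name:

    def dehomogenize(pts_h):
        # divide each column by its last entry and drop that row
        return pts_h[:-1, :] / pts_h[-1, :]

    # usage sketch: points_img = dehomogenize(K @ points)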
In [ ]:
 

Now let's suppose we moved the camera. It's still looking at the same points, but the camera center is now at $[200, 0, -200]$ and it's rotated 90 degrees "left": in terms of world coordinates, it now faces down the negative $x$ axis, with $-z$ going right and $+y$ going up.

HW #4¶
  1. For world Points 1 and 3 above, give the 3D coordinates of these points in the camera's local coordinate system.
HW #5¶
  1. Give a 4x4 frame (i.e., basis plus origin) matrix that describes this camera's pose; the contents of this matrix should be $$ \begin{bmatrix} \mathbf{u} & \mathbf{v} & \mathbf{w} & \mathbf{p} \\ 0 & 0 & 0 & 1\end{bmatrix} $$ where $\mathbf{u},\mathbf{v},\mathbf{w}$ are the (x, y, and z) basis vectors of the camera's local coordinate system, and $\mathbf{p}$​ is its origin.
HW #6¶
  1. The above frame matrix is the "frame-to-canonical" matrix: it converts points represented in the given coordinate frame back into world coordinates. What we want instead for the camera matrix is the opposite: a matrix that transforms world coordinates into camera coordinates. Confirm (using software) that the inverse of the matrix that you gave in #5 correctly transforms world coordinates of Points 1 and 3 into the correct camera coordinates you found in #4.
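
Before filling in the cells below, here is a toy frame (deliberately not the HW camera) to make the frame-to-canonical idea concrete: its origin is at $[1, 2, 3]$ and its axes are the world axes rotated 90 degrees about $z$.

    # toy frame: local x = world y, local y = -world x, local z = world z, origin at [1, 2, 3]
    toy_frame = np.array([
        [0, -1, 0, 1],
        [1,  0, 0, 2],
        [0,  0, 1, 3],
        [0,  0, 0, 1]
    ], dtype=np.float64)

    local_pt = np.array([1, 0, 0, 1.0])         # one unit along the frame's local x axis
    world_pt = toy_frame @ local_pt             # frame-to-canonical: [1, 3, 3, 1] in world coordinates
    back = np.linalg.inv(toy_frame) @ world_pt  # canonical-to-frame: recovers [1, 0, 0, 1]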
In [ ]:
# HW 5: write down the camera frame matrix 
cam_center = np.array([200, 0, -200], dtype=np.float64)
frame = np.array([
    [1, 0, 0, 0],
    [0, 1, 0, 0],
    [0, 0, 1, 0],
    [0, 0, 0, 1]
], dtype=np.float64)
frame
In [ ]:
np.linalg.inv(frame)
In [ ]:
# represent the 3D points in homogeneous coordinates (append a 1) so they can be translated
points_4d = np.ones((4, 3))
points_4d[:3, :] = points
points_4d
In [ ]:
# HW 6: Apply the inverse frame matrix to convert world coordinates to camera coordinates
# apply inv(frame) to points_4d and normalize; store them in pts_cam
HW #7¶
  1. Find (again, using software) the final pixel locations of world points 1 and 3.
In [ ]:
# pad the intrinsics to 3x4 so it drops the homogeneous (4th) coordinate when applied to 4D points
K4d = np.zeros((3, 4))
K4d[:3,:3] = K
K4d
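
Putting the pieces together (a general fact, not the HW answer): the full world-to-pixel map is the padded intrinsics composed with the extrinsics (the inverse frame matrix), $P = K_{4d}\,F^{-1}$. A sketch, assuming K and frame have been filled in above:

    P = K4d @ np.linalg.inv(frame)           # 3x4 camera matrix: world -> homogeneous image coordinates
    pts_img_h = P @ points_4d                # homogeneous pixel coordinates (3xN)
    pts_img = pts_img_h[:2] / pts_img_h[2]   # divide by the last row to get pixel coordinates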
In [ ]:
# HW7: find the final pixel locations of the points in the transformed camera
# apply K4d to pts_cam and store in pts_img
In [ ]: