Lecture 12¶
Announcements¶
- Homework self-reflection due tonight
- Midterm exam wrapper due Sunday night
- The P2 survey was not posted earlier, but it is now. Please fill it out by tonight (the artifact deadline)
Goals¶
- Be able to implement a basic rectified stereo depth estimation routine.
- Understand why matching is the hard part of stereo vision.
- Know the definition and formation of the stereo cost volume.
- Know why and how to use the normalized cross-correlation cost function for stereo matching.
- Understand the construction of the intrinsic and extrinsic camera matrices.
# boilerplate setup
%load_ext autoreload
%autoreload 2
%matplotlib inline
import os
import sys
src_path = os.path.abspath("../src")
if src_path not in sys.path:
    sys.path.insert(0, src_path)
# Library imports
import numpy as np
import imageio.v3 as imageio
import matplotlib.pyplot as plt
import skimage as skim
import cv2
# codebase imports
import util
import filtering
import features
import geometry
Outline¶
Rectified stereo:
depth from disparity: once we know each pixel's disparity, its depth follows directly, so stereo vision reduces to the correspondence problem
we assumed a simple case: the rectified case, where the two cameras differ only by a horizontal translation (same orientation, coplanar image planes), so corresponding points lie on the same scanline (row) in both images
correspondence - sounds familiar, but now it's dense: we need a match for every pixel. Some matching costs:
- SSD - sum of squared differences
- SAD - sum of absolute differences
- CC - cross-correlation: filter the right scanline with the left patch; where product is highest, call it a match; in practice, use NCC instead:
- NCC - normalized cross-correlation: standardize (subtract mean, divide by std) patches before multiplication to add invariance to photometric changes
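Written out for two patches $P$ and $Q$ with $N$ pixels each (the code further below omits the $\frac{1}{N}$, which doesn't change which disparity wins, since every candidate patch has the same size): $$\mathrm{NCC}(P, Q) = \frac{1}{N}\sum_{k=1}^{N}\frac{(P_k - \bar{P})}{\sigma_P}\,\frac{(Q_k - \bar{Q})}{\sigma_Q}$$ Note that NCC is a similarity score (higher is better), whereas SSD and SAD are costs (lower is better).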
The cost volume: given a matching cost c:
for i in rows:
    for j in columns:
        for d in disparities:
            C[i, j, d] = c(img1[i, j], img2[i, j+d])
(note that c will usually look at a patch around img[i, j])
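As a sketch of how that triple loop might look in NumPy when the per-pixel work is vectorized (illustrative only: build_cost_volume is a hypothetical helper, img1/img2 are assumed same-size grayscale float arrays, and here c is a per-pixel squared difference rather than a patch cost):
def build_cost_volume(img1, img2, disparities):
    # C[i, j, k] holds c(img1[i, j], img2[i, j + disparities[k]]); out-of-bounds shifts stay at inf
    H, W = img1.shape
    C = np.full((H, W, len(disparities)), np.inf)
    for k, d in enumerate(disparities):
        lo, hi = max(0, -d), min(W, W - d)   # columns j where j + d stays inside the image
        C[:, lo:hi, k] = (img1[:, lo:hi] - img2[:, lo + d:hi + d]) ** 2
    return C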
left = util.imread_grayfloat("../data/flowers_left.png")
right = util.imread_grayfloat("../data/flowers_right.png")
util.imshow_gray(np.vstack((left, right)))
# patch = left[115:125, 205:215]
# patch = left[55:61, 102:107]
patch = left[0:35, 45:80]
util.imshow_gray(patch)
def fast_filter(img, kernel):
    # cross-correlate img with kernel using OpenCV (much faster than a Python loop)
    return cv2.filter2D(img, -1, kernel)
# zero-mean both the template patch and the image so the response peaks where the patch matches
kernel = patch - patch.mean()
xcorr_out = fast_filter(right - right.mean(), kernel)
# show the right image stacked on top of the (max-normalized) correlation response
plt.imshow(np.vstack([right, xcorr_out / xcorr_out.max()]))
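To read an actual match location off that response map, we can take its argmax; a small sketch (np.unravel_index converts the flat argmax index back into a (row, column) pair):
# location of the strongest zero-mean cross-correlation response in the right image
peak_row, peak_col = np.unravel_index(np.argmax(xcorr_out), xcorr_out.shape)
print(peak_row, peak_col)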
import tqdm
def ncc_cost(left_patch, right_patch):
    # normalized cross-correlation: standardize both patches, then take the dot product.
    # Note this is a similarity (higher = better), unlike the costs below (lower = better).
    lp = (left_patch - left_patch.mean()) / left_patch.std()
    rp = (right_patch - right_patch.mean()) / right_patch.std()
    return (lp * rp).sum()
def ssd_cost(left_patch, right_patch):
    # sum of squared differences (lower = better)
    return np.sum((left_patch - right_patch)**2)
def sad_cost(left_patch, right_patch):
    # sum of absolute differences (lower = better)
    return np.sum(np.abs(left_patch - right_patch))
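A quick sanity check on these cost functions, comparing the patch cropped above against itself: SSD and SAD should be exactly zero, and NCC should equal the number of pixels in the patch (since the code skips the $1/N$ normalization):
# identical patches: zero cost for SSD/SAD, maximal similarity for NCC
print(ssd_cost(patch, patch))   # 0.0
print(sad_cost(patch, patch))   # 0.0
print(ncc_cost(patch, patch))   # equals patch.size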
H, W = left.shape
window = 5            # patch size (window x window)
hw = window // 2      # half-window
disparity_img = np.zeros_like(left)
disparity_limit = 60  # search disparities in [-60, 60]
for i in tqdm.tqdm(range(hw, H-hw)):
    low_i = i-hw
    high_i = i+hw+1
    for j in range(hw, W-hw):
        low_j = j-hw
        high_j = j+hw+1
        left_patch = left[low_i:high_i, low_j:high_j]
        # initialize all candidate costs to a large value, then fill in the valid ones
        costs = 1e5 * np.ones((disparity_limit*2+1))
        for d in range(-disparity_limit, disparity_limit+1):  # disparities
            if 0 <= low_j+d and high_j+d <= W:
                right_patch = right[low_i:high_i, low_j+d:high_j+d]
                costs[d + disparity_limit] = ssd_cost(left_patch, right_patch)
        # the best disparity is the one with the minimum matching cost
        disparity_img[i,j] = np.argmin(costs) - disparity_limit
plt.imshow(np.vstack([left, disparity_img/disparity_img.max()]))
plt.colorbar()
100%|████████████████████████████████████████████████████████████████████| 120/120 [00:11<00:00, 10.84it/s]
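To turn disparity into depth (the first goal above), we would use $Z = \frac{fB}{d}$, where $f$ is the focal length in pixels and $B$ is the baseline between the two cameras. We don't have the calibration for this image pair, so the numbers below are made-up placeholders; this is only a sketch of the conversion:
# Hypothetical depth-from-disparity conversion, Z = f * B / d
f_pixels = 500.0   # placeholder focal length (pixels), NOT the true calibration
baseline = 0.1     # placeholder baseline (arbitrary units)
d = np.abs(disparity_img)
depth = np.zeros_like(d)
valid = d > 0
depth[valid] = f_pixels * baseline / d[valid]
util.imshow_gray(depth / depth.max())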
np.set_printoptions(suppress=True) # suppress scientific notation
points = np.array([
    [0, 0, -200],
    [-20, 50, -200],
    [-100, 100, -200]
], dtype=np.float64).T
HW #2¶
Suppose a camera is in canonical pose - that is, the COP (center of projection) is at the world origin, the optical axis runs along the negative $z$ axis, and the projection plane is oriented with $x$ going right and $y$ going up in image space. The focal length of the camera is 100 (measured in pixels), and the height and width of the image are also 100. Find the image coordinates (i.e., pixel coordinates that correspond to indices into a numpy array) of the following three 3D points (these are the columns of the points array defined above):
- Point 1: $[0, 0, -200]$
- Point 2: $[-20, 50, -200]$
- Point 3: $[-100, 100, -200]$
Keep in mind that in numpy arrays, the origin is at the top left and $y$ goes down.
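As a reasoning sketch (not the only way to get there): with the conventions above, a point $[X, Y, Z]$ in front of the camera (so $Z < 0$) projects to pixel column $u = c_x + f\frac{X}{-Z}$ and pixel row $v = c_y - f\frac{Y}{-Z}$, with $f = 100$ and the principal point $(c_x, c_y) = (50, 50)$ at the image center. For Point 2, $u = 50 + 100 \cdot \frac{-20}{200} = 40$ and $v = 50 - 100 \cdot \frac{50}{200} = 25$, which matches the K @ points computation below.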
HW #3¶
Write down the intrinsics matrix $K$ that maps any point from camera coordinates to image coordinates as above. To check your work, make sure that applying the matrix to the three points in the previous problem yields the expected result.
# HW 3: fill in your intrinsics matrix here
# (the signs account for dividing by Z, which is negative for points in front of
#  the camera, and for pixel y going down while camera y goes up)
K = np.array([
    [-100, 0, 50],
    [0, 100, 50],
    [0, 0, 1]
], dtype=np.float64)
# HW 3: verify that K @ points yields the expected pixel coordinates
points_img = K @ points
points_img = points_img / points_img[2,:]
points_img
array([[50., 40., -0.],
       [50., 25., -0.],
       [ 1.,  1.,  1.]])
Now let's suppose we moved the camera. It's still looking at the same points, but the camera center is now at $[200, 0, -200]$ and the camera has been rotated 90 degrees "left": in terms of world coordinates, it now faces down the negative $x$ axis, with $-z$ going right and $+y$ going up.
HW #4¶
- For world Points 1 and 3 above, give the 3D coordinates of these points in the camera's local coordinate system. (A quick reasoning sketch for Point 1 follows below.)
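A reasoning sketch for Point 1, assuming the pose described above: the camera center is at $[200, 0, -200]$ and the camera looks down the world $-x$ axis. Point 1 is at $[0, 0, -200]$, i.e., 200 units straight ahead along the viewing direction, so in camera coordinates it sits on the optical axis at $[0, 0, -200]$ (straight down the camera's $-z$ axis). This is confirmed by the frame-matrix computation below.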
HW #5¶
- Give a 4x4 frame (i.e., basis plus origin) matrix that describes this camera's pose; the contents of this matrix should be $$ \begin{bmatrix} \mathbf{u} & \mathbf{v} & \mathbf{w} & \mathbf{p} \\ 0 & 0 & 0 & 1\end{bmatrix} $$ where $\mathbf{u},\mathbf{v},\mathbf{w}$ are the (x, y, and z) basis vectors of the camera's local coordinate system, and $\mathbf{p}$ is its origin.
HW #6¶
- The above frame matrix is the "frame-to-canonical" matrix: it converts points represented in the given coordinate frame back into world coordinates. What we want instead for the camera matrix is the opposite: a matrix that transforms world coordinates into camera coordinates. Confirm (using software) that the inverse of the matrix that you gave in #5 correctly transforms world coordinates of Points 1 and 3 into the correct camera coordinates you found in #4.
# HW 5: write down the camera frame matrix
# columns are u, v, w (the camera's x, y, z basis vectors in world coordinates) and p (camera center)
cam_center = np.array([200, 0, -200], dtype=np.float64)
frame = np.array([
    [ 0, 0, 1,  200],
    [ 0, 1, 0,    0],
    [-1, 0, 0, -200],
    [ 0, 0, 0,    1]
], dtype=np.float64)
frame
array([[   0.,    0.,    1.,  200.],
       [   0.,    1.,    0.,    0.],
       [  -1.,    0.,    0., -200.],
       [   0.,    0.,    0.,    1.]])
# make the 3D points homogeneous (append a 1) so the 4x4 frame matrix can translate them
points_4d = np.ones((4, 3))
points_4d[:3, :] = points
points_4d
array([[   0.,  -20., -100.],
       [   0.,   50.,  100.],
       [-200., -200., -200.],
       [   1.,    1.,    1.]])
# HW 6: apply the inverse frame matrix to map world coordinates to camera coordinates
pts_cam = np.linalg.inv(frame) @ points_4d
pts_cam /= pts_cam[3,:]
pts_cam
array([[   0.,    0.,    0.],
       [   0.,   50.,  100.],
       [-200., -220., -300.],
       [   1.,    1.,    1.]])
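An aside on this design choice: because the frame matrix is a rigid transform (a rotation plus a translation), its inverse has the closed form $\begin{bmatrix} R^\top & -R^\top\mathbf{p} \\ \mathbf{0} & 1\end{bmatrix}$, so a general matrix inverse isn't strictly needed. A minimal sketch checking this against np.linalg.inv:
# closed-form inverse of a rigid frame matrix (rotation R, translation p)
R = frame[:3, :3]
p = frame[:3, 3]
frame_inv = np.eye(4)
frame_inv[:3, :3] = R.T
frame_inv[:3, 3] = -R.T @ p
print(np.allclose(frame_inv, np.linalg.inv(frame)))  # expect True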
HW #7¶
- Find (again, using software) the final pixel locations of world points 1 and 3.
# pad the intrinsics to 3x4 so it drops the 4th (homogeneous) coordinate of camera-space points
K4d = np.zeros((3, 4))
K4d[:3,:3] = K
K4d
array([[-100.,    0.,   50.,    0.],
       [   0.,  100.,   50.,    0.],
       [   0.,    0.,    1.,    0.]])
# HW 7: find the final pixel locations of the points as seen by the transformed camera
points_img = K4d @ pts_cam
points_img /= points_img[2,:]
print(points_img)
[[50.         50.         50.        ]
 [50.         27.27272727 16.66666667]
 [ 1.          1.          1.        ]]
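Putting the two pieces together: the full camera (projection) matrix is the 3x4 intrinsics times the world-to-camera extrinsics. A minimal sketch, reusing K4d, frame, and points_4d from above, which should reproduce the same pixel coordinates in a single multiplication:
# full projection matrix: intrinsics @ extrinsics (world -> camera -> image)
P = K4d @ np.linalg.inv(frame)
proj = P @ points_4d
proj /= proj[2, :]   # divide out the homogeneous coordinate
print(proj)          # should match points_img above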