import imageio.v3 as iio
import matplotlib.pyplot as plt
import numpy as np


def compare(*images):
    """Display one or more images side by side in a single row.

    Args:
        *images: Arrays to draw; each one is passed to ``Axes.imshow`` with
            ``cmap="gray"`` in its own subplot, left to right.

    Raises:
        ValueError: If no images are given.
    """
    if not images:
        raise ValueError("compare() requires at least one image")
    # squeeze=False always returns a 2-D array of Axes. Without it, a single
    # image yields a bare Axes object that cannot be iterated with zip().
    _, axs = plt.subplots(1, len(images), figsize=(15, 6), squeeze=False)
    for ax, image in zip(axs[0], images):
        ax.imshow(image, cmap="gray")
    plt.show()

# Read image as grayscale and preview it
dubs = iio.imread("dubs.jpg", mode="L")
plt.imshow(dubs, cmap="gray");

dubs[100, 100]

242

f(100, 100) = 242

%%html
<iframe width="640" height="360" src="https://www.youtube-nocookie.com/embed/KuXjwB4LzSA?start=538&end=588" title="YouTube video player" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share" allowfullscreen></iframe>

np.ones((3, 3))

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])

# 3x3 box blur: nine equal weights of 1/9, so the kernel sums to 1
box_blur_3x3 = 1 / 9 * np.ones((3, 3))
box_blur_3x3

array([[0.11111111, 0.11111111, 0.11111111],
       [0.11111111, 0.11111111, 0.11111111],
       [0.11111111, 0.11111111, 0.11111111]])

def get_subimages(image, kernel_shape):
    """Returns an array of subimages matching the given kernel shape.

    Args:
        image: 2-D array of pixel values.
        kernel_shape: ``(kernel_h, kernel_w)`` size of each subimage.

    Returns:
        A float64 array of shape
        ``(image_h - kernel_h + 1, image_w - kernel_w + 1, kernel_h, kernel_w)``
        in which entry ``[ih, iw]`` is a copy of
        ``image[ih:ih + kernel_h, iw:iw + kernel_w]``.
    """
    image_h, image_w = image.shape
    kernel_h, kernel_w = kernel_shape
    subimages_h = image_h - kernel_h + 1
    subimages_w = image_w - kernel_w + 1
    if subimages_h <= 0 or subimages_w <= 0:
        # No complete window fits inside the image. np.zeros returns an empty
        # array for a zero-sized dimension and raises ValueError for a
        # negative one.
        return np.zeros((subimages_h, subimages_w, kernel_h, kernel_w))
    # Rows index the first axis and columns the second, so window [ih, iw]
    # starts at image[ih, iw]. The view shares memory with the image.
    windows = np.lib.stride_tricks.sliding_window_view(image, (kernel_h, kernel_w))
    # Copy into an independent, writable, C-ordered float array.
    return windows.astype(np.float64, order="C")

# Crop rows 50-99 and columns 300-349 of the image
dubs_eye = dubs[50:100, 300:350]
plt.imshow(dubs_eye, cmap="gray");

# Sanity check: the subimage stored at index (30, 20) should equal the 3x3
# window of the crop whose top-left corner is at row 30, column 20
dubs_eye_subimages = get_subimages(dubs_eye, (3, 3))
compare(dubs_eye_subimages[(30, 20)], dubs_eye[30:33, 20:23])
assert np.allclose(dubs_eye_subimages[(30, 20)], dubs_eye[30:33,20:23])

def convolve(image, kernel):
    """Returns the convolution of the image and kernel where the image shrinks by kernel shape.

    Each output value is the sum of the element-wise product between the
    kernel and the subimage whose top-left corner is at that position. The
    kernel is applied as given (it is not flipped).

    Args:
        image: 2-D array of pixel values.
        kernel: 2-D array of weights.

    Returns:
        A 2-D array of shape
        ``(image_h - kernel_h + 1, image_w - kernel_w + 1)``.
    """
    subimages = get_subimages(image, kernel.shape)
    # Contract the two trailing (kernel-sized) axes of every subimage against
    # the kernel in one call: result[i, j] = sum(subimages[i, j] * kernel).
    return np.einsum("ijkl,kl->ij", subimages, kernel)


dubs_blurred = convolve(dubs, box_blur_3x3)
compare(dubs, dubs_blurred)

dubs_eye_subimages[(30, 20)], box_blur_3x3

(array([[123., 166.,  76.],
        [ 61., 120., 110.],
        [ 31.,  58., 103.]]),
 array([[0.11111111, 0.11111111, 0.11111111],
        [0.11111111, 0.11111111, 0.11111111],
        [0.11111111, 0.11111111, 0.11111111]]))

dubs_eye_subimages[(30, 20)] * box_blur_3x3

array([[13.66666667, 18.44444444,  8.44444444],
       [ 6.77777778, 13.33333333, 12.22222222],
       [ 3.44444444,  6.44444444, 11.44444444]])

(dubs_eye_subimages[(30, 20)] * box_blur_3x3).sum()

94.22222222222221

np.dot(dubs_eye_subimages[(30, 20)], box_blur_3x3)

array([[40.55555556, 40.55555556, 40.55555556],
       [32.33333333, 32.33333333, 32.33333333],
       [21.33333333, 21.33333333, 21.33333333]])

dubs_eye_subimages[(30, 20)] @ box_blur_3x3

array([[40.55555556, 40.55555556, 40.55555556],
       [32.33333333, 32.33333333, 32.33333333],
       [21.33333333, 21.33333333, 21.33333333]])

# 10x10 box blur: start from all ones, then divide in place by the number of
# entries (100) so every weight is 0.01 and the kernel sums to 1
box_blur_10x10 = np.ones((10, 10))
box_blur_10x10 /= box_blur_10x10.size
box_blur_10x10

array([[0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01],
       [0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01, 0.01]])

dubs_blurred_10x10 = convolve(dubs, box_blur_10x10)
compare(dubs, dubs_blurred_10x10)

# Identity kernel: only the center weight is nonzero, so each output pixel is
# simply the center pixel of its 3x3 window
kernel = np.zeros((3, 3))
kernel[1, 1] = 1
kernel

array([[0., 0., 0.],
       [0., 1., 0.],
       [0., 0., 0.]])

compare(dubs, convolve(dubs, kernel))

# Set up the previous kernel
kernel = np.zeros((3, 3))
kernel[1, 1] = 1
# Double the previous kernel minus the box blur kernel: the center weight
# becomes 2 - 1/9 and every other weight -1/9, so the weights still sum to 1
kernel = 2 * kernel - box_blur_3x3
kernel

array([[-0.11111111, -0.11111111, -0.11111111],
       [-0.11111111,  1.88888889, -0.11111111],
       [-0.11111111, -0.11111111, -0.11111111]])

compare(dubs, convolve(dubs, kernel))

# 1-D weights that rise to a peak in the middle and fall off symmetrically
values = [[1, 2, 4, 7, 11, 11, 7, 4, 2, 1]]
# Broadcasting the (1, 10) row against its (10, 1) transpose gives the 10x10
# outer product of the weights with themselves
kernel = np.array(values) * np.array(values).T
# Normalize so the weights sum to 1
kernel = kernel / kernel.sum()
# Show values rounded to two decimal places
kernel.round(2)

array([[0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  ],
       [0.  , 0.  , 0.  , 0.01, 0.01, 0.01, 0.01, 0.  , 0.  , 0.  ],
       [0.  , 0.  , 0.01, 0.01, 0.02, 0.02, 0.01, 0.01, 0.  , 0.  ],
       [0.  , 0.01, 0.01, 0.02, 0.03, 0.03, 0.02, 0.01, 0.01, 0.  ],
       [0.  , 0.01, 0.02, 0.03, 0.05, 0.05, 0.03, 0.02, 0.01, 0.  ],
       [0.  , 0.01, 0.02, 0.03, 0.05, 0.05, 0.03, 0.02, 0.01, 0.  ],
       [0.  , 0.01, 0.01, 0.02, 0.03, 0.03, 0.02, 0.01, 0.01, 0.  ],
       [0.  , 0.  , 0.01, 0.01, 0.02, 0.02, 0.01, 0.01, 0.  , 0.  ],
       [0.  , 0.  , 0.  , 0.01, 0.01, 0.01, 0.01, 0.  , 0.  , 0.  ],
       [0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  , 0.  ]])

np.array(values)

array([[ 1,  2,  4,  7, 11, 11,  7,  4,  2,  1]])

np.array(values).T

array([[ 1],
       [ 2],
       [ 4],
       [ 7],
       [11],
       [11],
       [ 7],
       [ 4],
       [ 2],
       [ 1]])

compare(dubs, convolve(dubs, kernel))

compare(dubs_blurred_10x10, convolve(dubs, kernel))

def template_match(image, template):
    """
    Scores how well a grayscale template matches a grayscale image at every placement where the
    template fits entirely inside the image.

    Entry [ih, iw] of the returned numpy array is the sum of element-wise products between the
    mean-subtracted template and the mean-subtracted image window whose top-left corner is at
    row ih, column iw. Larger values indicate a closer match.
    """
    rows, cols = image.shape
    t_rows, t_cols = template.shape

    # The template is centered once; each window is centered as it is visited
    centered_template = template - template.mean()

    # One score per top-left corner at which the template still fits
    scores = np.zeros((rows - t_rows + 1, cols - t_cols + 1))

    # np.ndindex walks the corners in row-major order
    for top, left in np.ndindex(*scores.shape):
        window = image[top:top + t_rows, left:left + t_cols]
        scores[top, left] = np.sum(centered_template * (window - window.mean()))

    return scores


# Score every placement of the eye crop within the full image
match = template_match(dubs, dubs_eye)
compare(dubs, match)
# Convert the flat argmax index into the (row, column) of the best match
np.unravel_index(match.argmax(), match.shape)

(50, 300)

Convolutions

Convolutions as mathematical operators

Practice: Get subimages

Practice: Sum of element-wise products

Understanding kernels

Practice: Template match