import numpy as np
import matplotlib.pyplot as plt
from PIL import Image
import requests
from io import BytesIO

import numpy as np
import matplotlib.pyplot as plt
from PIL import Image
import requests
from io import BytesIO
%matplotlib inline

# Reaching this line means every import statement above ran without raising.
print("All imports successful!")

# IMAGE LOADER HELPER — run this cell as-is
# This gives you two PIL Image objects to work with throughout the notebook.

def load_color_image():
    """Return an RGB PIL Image for the color exercises.

    Tries to download a 320px-wide JPEG from Wikimedia Commons (5 s timeout)
    and converts it to mode 'RGB'. If any step of that raises, a synthetic
    100x100 gradient is returned instead, so the notebook also works offline.

    NOTE(review): the URL is the same ``Bikesgray.jpg`` that load_gray_image()
    fetches; judging by its file name the photo is probably grayscale, in
    which case R, G and B would be identical — confirm.
    """
    source_url = "https://upload.wikimedia.org/wikipedia/commons/thumb/3/3f/Bikesgray.jpg/320px-Bikesgray.jpg"
    try:
        payload = requests.get(source_url, timeout=5).content
        return Image.open(BytesIO(payload)).convert('RGB')
    except Exception:
        # Synthetic fallback: red grows down the rows, green grows across the
        # columns, blue is constant. The largest value is 99 * 2 = 198, so the
        # ramp fits in uint8 without wrapping.
        ramp = np.arange(100, dtype=np.uint8) * 2
        gradient = np.zeros((100, 100, 3), dtype=np.uint8)
        gradient[:, :, 0] = ramp[:, np.newaxis]
        gradient[:, :, 1] = ramp[np.newaxis, :]
        gradient[:, :, 2] = 128
        return Image.fromarray(gradient)

def load_gray_image():
    """Return a single-channel (mode 'L') PIL Image for the grayscale exercises.

    Tries to download a 320px-wide JPEG from Wikimedia Commons (5 s timeout)
    and converts it to mode 'L'. If any step of that raises, a synthetic
    100x100 diagonal ramp is returned instead.
    """
    source_url = "https://upload.wikimedia.org/wikipedia/commons/thumb/3/3f/Bikesgray.jpg/320px-Bikesgray.jpg"
    try:
        payload = requests.get(source_url, timeout=5).content
        return Image.open(BytesIO(payload)).convert('L')
    except Exception:
        # Synthetic fallback: brightness at (row, col) is (row + col) % 256.
        idx = np.arange(100)
        ramp = (idx[:, np.newaxis] + idx[np.newaxis, :]) % 256
        return Image.fromarray(ramp.astype(np.uint8))

# Load both working images once; later cells read these two globals.
# Each loader falls back to a synthetic 100x100 image if the download fails.
color_img = load_color_image()
gray_img  = load_gray_image()
print("Images loaded!")
# The loaders convert to 'RGB' and 'L' respectively (or build uint8 arrays of
# the matching shape in the fallback path).
print(f"Color image mode : {color_img.mode}")
print(f"Gray  image mode : {gray_img.mode}")

# DISPLAY HELPER — run this cell as-is
def show_images(images, titles=None, cmap_list=None, figsize=None):
    """
    Plots a list of images in a single row and shows the figure.

    Parameters:
        images    : list of numpy arrays or PIL Images
        titles    : list of title strings; defaults to 'Image 1', 'Image 2', ...
        cmap_list : list of colormaps, one per image (e.g. ['gray', None, 'hot'])
                    use None for color images, 'gray' for grayscale;
                    defaults to None for every image
        figsize   : optional (width, height) tuple; defaults to (5 * n, 4)
    """
    count = len(images)
    figsize = (5 * count, 4) if figsize is None else figsize
    titles = [f'Image {k+1}' for k in range(count)] if titles is None else titles
    cmap_list = [None] * count if cmap_list is None else cmap_list

    # squeeze=False always returns a 2-D grid of axes, so the single-image
    # case needs no special handling; row 0 is the only row.
    _, axis_grid = plt.subplots(1, count, figsize=figsize, squeeze=False)
    for axis, picture, caption, colormap in zip(axis_grid[0], images, titles, cmap_list):
        # PIL images are converted so imshow always receives an array.
        pixels = np.array(picture) if isinstance(picture, Image.Image) else picture
        axis.imshow(pixels, cmap=colormap)
        axis.set_title(caption)
        axis.axis('off')
    plt.tight_layout()
    plt.show()

print("show_images() helper ready.")

# YOUR CODE HERE
# Display the color image
show_images([color_img], titles=['Color Image'])

# Display the grayscale image
# show_images([gray_img], titles=['Grayscale Image'], cmap_list=...)

# YOUR CODE HERE
# np.array() turns each PIL image into a numpy array whose pixels can be
# indexed directly; later cells reuse color_arr and gray_arr.
color_arr = np.array(color_img)
gray_arr  = np.array(gray_img)

print("--- Color Array ---")
print("Shape:", color_arr.shape)   # What are these 3 numbers?
print("Dtype:", color_arr.dtype)
print("Min:",   color_arr.min(), "  Max:", color_arr.max())
print("Pixel at [0,0]:", color_arr[0, 0])         # What is this?
print("Red value at [0,0]:", color_arr[0, 0, 0])  # And this?

print("\n--- Grayscale Array ---")
print("Shape:", gray_arr.shape)
print("Dtype:", gray_arr.dtype)

# Slicing [:5, :5] selects the first five rows and the first five columns.
print("\nFirst 5x5 block of grayscale:")
print(gray_arr[:5, :5])

# YOUR CODE HERE

# 1. Image dimensions
# shape[0] is the number of rows, shape[1] the number of columns.
height = color_arr.shape[0]
width  = color_arr.shape[1]
print(f"Image size: {height} rows x {width} columns")

# 2. Center pixel
# center_row = ???
# center_col = ???
# print(color_arr[center_row, center_col])

# 3. Bottom-right corner pixel
# print(color_arr[???, ???])

# 4. First row of grayscale
# print(gray_arr[0, :])

# 5. Average brightness using ONLY Python loops
total = 0
count = 0
# YOUR LOOP HERE
# for r in range(...):
#     for c in range(...):
#         ...

# Until the loop above is filled in, count stays 0; the guard avoids a
# ZeroDivisionError and the manual average prints as 0.00.
avg_brightness = total / count if count > 0 else 0
print(f"Average brightness (manual loop): {avg_brightness:.2f}")
print(f"Verify with numpy:                {gray_arr.mean():.2f}")

# YOUR CODE HERE

# Top-left 20x20 patch
gray_patch = gray_arr[:20, :20]
show_images([gray_patch], titles=['Grayscale top-left 20x20'], cmap_list=['gray'])

# Color patch
# color_patch = color_arr[:20, :20]
# show_images(...)

# Middle patch — compute the middle coordinates first!
# mid_r = ???
# mid_c = ???
# gray_mid  = gray_arr[mid_r-10:mid_r+10, mid_c-10:mid_c+10]
# color_mid = color_arr[mid_r-10:mid_r+10, mid_c-10:mid_c+10]
# show_images([gray_mid, color_mid], ...)

# YOUR CODE HERE

# 1. Top-left pixel
print("Top-left pixel R,G,B:", color_arr[0, 0])

# 2. Build the 4x4 test array
# Starts as all zeros, so it displays as black until rows are filled in.
test = np.zeros((4, 4, 3), dtype=np.uint8)
# Fill row 0 with red...
# YOUR CODE
show_images([test], titles=['Test 4x4 color array'])

# 3. Channel access
# Index order is [row, column, channel].
print("test[0,0,0] (Red of first pixel):   ", test[0, 0, 0])
print("test[1,0,1] (??? of second row):    ", test[1, 0, 1])

# YOUR CODE HERE

# Re-read the dimensions so this cell does not rely on the earlier one.
height = color_arr.shape[0]
width  = color_arr.shape[1]

red_channel = np.zeros((height, width), dtype=np.uint8)

# Loop over every pixel and extract Red value
# While the body is still `pass`, red_channel stays all zeros.
for r in range(height):
    for c in range(width):
        pass  # red_channel[r, c] = ???

show_images([red_channel], titles=['Red Channel (as grayscale)'], cmap_list=['gray'])

# EXTRA: Extract Green and Blue channels the same way
green_channel = np.zeros((height, width), dtype=np.uint8)
blue_channel  = np.zeros((height, width), dtype=np.uint8)

# YOUR LOOPS HERE

# Display all three channels side by side
# Each 2-D channel is drawn with a matplotlib colormap of the matching hue.
show_images(
    [red_channel, green_channel, blue_channel],
    titles=['Red', 'Green', 'Blue'],
    cmap_list=['Reds', 'Greens', 'Blues']
)

# YOUR CODE HERE

# Build red_image: (H, W, 3) with only red channel filled
red_image = np.zeros((height, width, 3), dtype=np.uint8)
for r in range(height):
    for c in range(width):
        pass  # red_image[r, c, 0] = ???

show_images([red_image], titles=['Red channel as color'])

# Build green_image and blue_image similarly
# ...

# Add them together — watch out for overflow!
# combined = ???

# METHOD 1: Average
def rgb_to_gray_average(arr):
    """
    Converts color image to grayscale using simple average: (R+G+B)/3.

    The three channel values are widened to Python ints before they are
    added. Adding the raw uint8 scalars wraps around at 256 (for example
    200 + 200 + 200 becomes 88), which made bright pixels come out dark.

    arr: numpy array of shape (H, W, 3), dtype uint8
    Returns: numpy array of shape (H, W), dtype uint8; each value is the
             channel average truncated to an integer
    """
    h, w = arr.shape[0], arr.shape[1]
    result = np.zeros((h, w), dtype=np.uint8)
    for r in range(h):
        for c in range(w):
            # int() lifts the values out of uint8 so the sum cannot overflow.
            R, G, B = int(arr[r, c, 0]), int(arr[r, c, 1]), int(arr[r, c, 2])
            gray = int((R + G + B) / 3)
            # Clamp defensively in case the input holds values outside 0..255.
            result[r, c] = max(0, min(255, gray))
    return result

# YOUR CODE: implement the other methods
def rgb_to_gray_lightness(arr):
    """
    Converts color image to grayscale using lightness:
    (max(R, G, B) + min(R, G, B)) / 2, truncated to an integer.

    arr: numpy array of shape (H, W, 3), dtype uint8
    Returns: numpy array of shape (H, W), dtype uint8
    """
    h, w = arr.shape[0], arr.shape[1]
    result = np.zeros((h, w), dtype=np.uint8)
    for r in range(h):
        for c in range(w):
            # int() lifts the values out of uint8 so max + min cannot wrap at 256.
            R, G, B = int(arr[r, c, 0]), int(arr[r, c, 1]), int(arr[r, c, 2])
            gray = (max(R, G, B) + min(R, G, B)) // 2
            result[r, c] = max(0, min(255, gray))
    return result

def rgb_to_gray_luminosity(arr):
    """
    Converts color image to grayscale using the weighted sum
    0.299 R + 0.587 G + 0.114 B, rounded to the nearest integer.

    Rounding (rather than truncating) keeps pure white at 255 even when the
    floating-point sum lands a hair below 255.0.

    arr: numpy array of shape (H, W, 3), dtype uint8
    Returns: numpy array of shape (H, W), dtype uint8
    """
    h, w = arr.shape[0], arr.shape[1]
    result = np.zeros((h, w), dtype=np.uint8)
    for r in range(h):
        for c in range(w):
            R, G, B = int(arr[r, c, 0]), int(arr[r, c, 1]), int(arr[r, c, 2])
            gray = int(round(0.299 * R + 0.587 * G + 0.114 * B))
            result[r, c] = max(0, min(255, gray))
    return result

def rgb_to_gray_mymethod(arr):
    """Your own formula!

    Placeholder for a self-designed conversion; it currently ignores `arr`
    and returns None.
    """
    return None

# Test — run average on the color image
gray_average = rgb_to_gray_average(color_arr)
print("Shape:", gray_average.shape)
print("Dtype:", gray_average.dtype)

# YOUR CODE HERE

# Apply all methods
# (recomputed here so this cell can be run without the test cell above)
gray_average   = rgb_to_gray_average(color_arr)
# gray_lightness  = rgb_to_gray_lightness(color_arr)
# gray_luminosity = rgb_to_gray_luminosity(color_arr)
# gray_mymethod   = rgb_to_gray_mymethod(color_arr)

# Display all side by side
# show_images([gray_average, gray_lightness, gray_luminosity, gray_mymethod],
#             titles=['Average', 'Lightness', 'Luminosity', 'My Method'],
#             cmap_list=['gray', 'gray', 'gray', 'gray'])

# Compute pixel-wise difference between average and luminosity using loops
# diff[r, c] = abs(gray_average[r,c] - gray_luminosity[r,c])

# YOUR CODE HERE
# diff has the same height and width as gray_average and starts as all zeros.
h, w = gray_average.shape
diff = np.zeros((h, w), dtype=np.uint8)

# for r in range(h):
#     for c in range(w):
#         ...

# show_images([diff], titles=['Difference: Average vs Luminosity'], cmap_list=['hot'])

# SETUP HELPER — run this cell as-is
# Resize the grayscale image to exactly 100x100 using PIL
# img_100 is the fixed-size input used by the downsampling and convolution cells.
img_100 = np.array(gray_img.resize((100, 100), Image.LANCZOS))
print("Shape of 100x100 image:", img_100.shape)
show_images([img_100], titles=['100×100 Grayscale'], cmap_list=['gray'])

# METHOD A: Nearest Neighbor Downsampling
def downsample_nearest(img):
    """
    Downsamples a (H, W) image to (H//2, W//2) by taking every other pixel.

    Output pixel (r, c) is a copy of input pixel (2*r, 2*c), i.e. the
    top-left pixel of each 2x2 block. With an odd H or W the last row or
    column of the input is dropped.

    Returns: numpy array of shape (H//2, W//2), dtype uint8
    """
    h, w = img.shape
    out_h, out_w = h // 2, w // 2
    result = np.zeros((out_h, out_w), dtype=np.uint8)
    for r in range(out_h):
        for c in range(out_w):
            result[r, c] = img[2 * r, 2 * c]
    return result


# METHOD B: Average Pooling
def downsample_average(img):
    """
    Downsamples by averaging each 2x2 block.

    Output pixel (r, c) is the mean of input pixels (2r, 2c), (2r, 2c+1),
    (2r+1, 2c) and (2r+1, 2c+1), truncated to an integer. With an odd H or W
    the last row or column of the input is dropped.

    Returns: numpy array of shape (H//2, W//2), dtype uint8
    """
    h, w = img.shape
    out_h, out_w = h // 2, w // 2
    result = np.zeros((out_h, out_w), dtype=np.uint8)
    for r in range(out_h):
        for c in range(out_w):
            top, left = 2 * r, 2 * c
            # int() lifts each value out of uint8 so the sum cannot wrap at 256.
            block_sum = (int(img[top, left]) + int(img[top, left + 1])
                         + int(img[top + 1, left]) + int(img[top + 1, left + 1]))
            result[r, c] = block_sum // 4
    return result


# METHOD C: Max Pooling
def downsample_max(img):
    """
    Downsamples by taking the maximum of each 2x2 block.

    Output pixel (r, c) is the largest of input pixels (2r, 2c), (2r, 2c+1),
    (2r+1, 2c) and (2r+1, 2c+1). With an odd H or W the last row or column of
    the input is dropped.

    Returns: numpy array of shape (H//2, W//2), dtype uint8
    """
    h, w = img.shape
    out_h, out_w = h // 2, w // 2
    result = np.zeros((out_h, out_w), dtype=np.uint8)
    for r in range(out_h):
        for c in range(out_w):
            top, left = 2 * r, 2 * c
            result[r, c] = max(img[top, left], img[top, left + 1],
                               img[top + 1, left], img[top + 1, left + 1])
    return result


# METHOD D: YOUR OWN
def downsample_mymethod(img):
    """Your own downsampling method — describe it in the docstring!

    Placeholder: it currently ignores `img` and returns None.
    """
    return None


# Test one of them
small = downsample_nearest(img_100)
print("Output shape:", small.shape)  # Should be (50, 50)

# YOUR CODE HERE

# Apply all methods
# small_nearest is also read by the Part 5 setup cell that builds img_50.
small_nearest = downsample_nearest(img_100)
# small_average  = downsample_average(img_100)
# small_max      = downsample_max(img_100)
# small_mymethod = downsample_mymethod(img_100)

# Display side by side with original
# show_images(
#     [img_100, small_nearest, small_average, small_max, small_mymethod],
#     titles=['Original 100x100', 'Nearest (50x50)', 'Average (50x50)', 'Max (50x50)', 'My Method (50x50)'],
#     cmap_list=['gray'] * 5
# )

# Compute difference map between nearest and average (using loops)
# diff_down has the same shape as small_nearest and starts as all zeros.
h, w = small_nearest.shape
diff_down = np.zeros((h, w), dtype=np.uint8)

# YOUR LOOP HERE
# The int() casts below keep the subtraction from wrapping around in uint8.
# for r in range(h):
#     for c in range(w):
#         diff_down[r, c] = abs(int(small_nearest[r,c]) - int(small_average[r,c]))

# show_images([diff_down], titles=['Difference: Nearest vs Average'], cmap_list=['hot'])

# Use the 50x50 image from Part 4
# If you didn't finish Part 4, here's a fallback:
# An unfinished downsample_nearest() still returns an array (all zeros), so
# checking only "defined and not None" would never reach the fallback. The
# result is therefore also required to be 50x50 and to contain at least one
# non-zero pixel before it is trusted.
_part4_done = (
    'small_nearest' in globals()
    and small_nearest is not None
    and small_nearest.shape == (50, 50)
    and bool(small_nearest.any())
)
img_50 = small_nearest if _part4_done else np.array(gray_img.resize((50, 50)))
print("Working with 50x50 image, shape:", img_50.shape)
show_images([img_50], titles=['50×50 Input'], cmap_list=['gray'])

# METHOD A: Nearest Neighbor Upsampling
def upsample_nearest(img, scale=2):
    """
    Upsamples a (H, W) image to (H*scale, W*scale) by pixel replication.
    Each output pixel (r, c) copies from input (r//scale, c//scale).

    Parameters:
        img   : 2D numpy array of shape (H, W)
        scale : positive integer enlargement factor

    Returns: numpy array of shape (H*scale, W*scale), dtype uint8
    """
    h, w = img.shape
    out_h, out_w = h * scale, w * scale
    result = np.zeros((out_h, out_w), dtype=np.uint8)
    for r in range(out_h):
        src_r = r // scale  # same source row for the whole output row
        for c in range(out_w):
            result[r, c] = img[src_r, c // scale]
    return result


# METHOD B: Bilinear Interpolation
def lerp(a, b, t):
    """Linear interpolation between a and b. t=0 gives a, t=1 gives b.

    Written as a weighted sum instead of a + (b - a) * t so that unsigned
    pixel values (e.g. numpy uint8) are never subtracted from each other,
    which would wrap around whenever b < a.
    """
    return a * (1.0 - t) + b * t

def upsample_bilinear(img, scale=2):
    """
    Upsamples using bilinear interpolation.
    For each output pixel (r, c):
      - Map to input coordinates: in_r = r / scale, in_c = c / scale
      - Find the four surrounding input pixels
      - Interpolate along the columns first, then along the rows

    Neighbors that would fall outside the image are clamped to the last row
    or column, so the bottom and right borders repeat the edge pixels.

    Parameters:
        img   : 2D numpy array of shape (H, W) with values in 0..255
        scale : positive enlargement factor

    Returns: numpy array of shape (H*scale, W*scale), dtype uint8, each value
             rounded to the nearest integer
    """
    h, w = img.shape
    out_h, out_w = h * scale, w * scale
    result = np.zeros((out_h, out_w), dtype=np.uint8)
    for r in range(out_h):
        for c in range(out_w):
            # Map output coordinates to input space
            in_r = r / scale
            in_c = c / scale

            # Find surrounding pixel indices
            r0 = int(in_r)          # floor
            c0 = int(in_c)          # floor
            r1 = min(r0 + 1, h - 1) # ceiling, clamped to image
            c1 = min(c0 + 1, w - 1)

            # Fractional parts (where between r0 and r1 are we?)
            dr = in_r - r0
            dc = in_c - c0

            # Work in floats: mixing raw uint8 values could wrap around.
            top_left, top_right = float(img[r0, c0]), float(img[r0, c1])
            bottom_left, bottom_right = float(img[r1, c0]), float(img[r1, c1])

            # Step 1: interpolate the top row and bottom row
            top = top_left * (1.0 - dc) + top_right * dc
            bottom = bottom_left * (1.0 - dc) + bottom_right * dc
            # Step 2: interpolate between top and bottom
            value = top * (1.0 - dr) + bottom * dr

            # Round to nearest and clamp into the uint8 range.
            result[r, c] = min(255, max(0, int(value + 0.5)))

    return result


# METHOD C: YOUR OWN
def upsample_mymethod(img, scale=2):
    """Your own upsampling method!

    Placeholder: it currently ignores `img` and `scale` and returns None.
    """
    return None


# Test Method A
big_nearest = upsample_nearest(img_50)
print("Output shape:", big_nearest.shape)  # Should be (100, 100)

# YOUR CODE HERE

# Apply all methods
# big_nearest is compared against img_100 in the MAE cell further down.
big_nearest   = upsample_nearest(img_50)
# big_bilinear  = upsample_bilinear(img_50)
# big_mymethod  = upsample_mymethod(img_50)

# Display all vs original
# show_images(
#     [img_100, big_nearest, big_bilinear, big_mymethod],
#     titles=['Original 100x100', 'Nearest (100x100)', 'Bilinear (100x100)', 'My Method'],
#     cmap_list=['gray'] * 4
# )

# Compute MAE for each method vs the original (using loops)
def mean_absolute_error(img_a, img_b):
    """
    Computes pixel-wise mean absolute error between two same-size images.
    Use only Python loops — no np.mean, no array subtraction.

    Parameters:
        img_a, img_b : 2D numpy arrays with identical shapes

    Returns: the average of |img_a[r, c] - img_b[r, c]| over all pixels as a
             float; 0.0 for images that contain no pixels

    Raises:
        ValueError : if the two shapes differ
    """
    if img_a.shape != img_b.shape:
        raise ValueError(
            f"image shapes differ: {img_a.shape} vs {img_b.shape}"
        )
    h, w = img_a.shape
    if h * w == 0:
        return 0.0
    total = 0
    for r in range(h):
        for c in range(w):
            # int() lifts the values out of uint8 so the difference can go
            # negative instead of wrapping around.
            total += abs(int(img_a[r, c]) - int(img_b[r, c]))
    return total / (h * w)

# Compute and print MAE for each method
# big_nearest is the 50x50 image upsampled by 2; img_100 is the 100x100 reference.
mae_nearest = mean_absolute_error(big_nearest, img_100)
print(f"MAE (Nearest):  {mae_nearest:.4f}")

# Add bilinear and mymethod when ready
# mae_bilinear = mean_absolute_error(big_bilinear, img_100)
# print(f"MAE (Bilinear): {mae_bilinear:.4f}")

# METHOD A: Nearest Neighbor Resize (arbitrary target size)
def resize_nearest(img, target_h, target_w):
    """
    Resizes img to (target_h, target_w) using nearest neighbor.
    For output pixel (r, c) the source pixel is
      in_r = int(r * h / target_h), in_c = int(c * w / target_w)
    (rounded down, not to the nearest integer), each clamped to the last valid
    row or column.

    Parameters:
        img      : 2D numpy array of shape (h, w)
        target_h : number of output rows
        target_w : number of output columns

    Returns: numpy array of shape (target_h, target_w), dtype uint8
    """
    h, w = img.shape
    result = np.zeros((target_h, target_w), dtype=np.uint8)
    for r in range(target_h):
        # Map to input coordinates; the row index is the same for every column.
        in_r = min(int(r * h / target_h), h - 1)
        for c in range(target_w):
            in_c = min(int(c * w / target_w), w - 1)
            result[r, c] = img[in_r, in_c]
    return result


# METHOD B: Bilinear Resize (arbitrary target size)
def resize_bilinear(img, target_h, target_w):
    """
    Resizes img to (target_h, target_w) using bilinear interpolation.
    For output pixel (r, c), the input coordinates are:
      in_r = r * (h - 1) / (target_h - 1)
      in_c = c * (w - 1) / (target_w - 1)
    so the first and last output rows/columns land exactly on the first and
    last input rows/columns. A target size of 1 maps to input index 0.
    Then bilinearly interpolate between the four surrounding input pixels.

    Parameters:
        img      : 2D numpy array of shape (h, w) with values in 0..255
        target_h : number of output rows
        target_w : number of output columns

    Returns: numpy array of shape (target_h, target_w), dtype uint8, each
             value rounded to the nearest integer
    """
    h, w = img.shape
    result = np.zeros((target_h, target_w), dtype=np.uint8)
    for r in range(target_h):
        for c in range(target_w):
            # Input coordinates (note: use (h-1)/(target_h-1) to map edges correctly)
            # max(1, ...) avoids dividing by zero when the target size is 1.
            in_r = r * (h - 1) / max(1, target_h - 1)
            in_c = c * (w - 1) / max(1, target_w - 1)

            r0 = int(in_r)
            c0 = int(in_c)
            r1 = min(r0 + 1, h - 1)
            c1 = min(c0 + 1, w - 1)

            dr = in_r - r0
            dc = in_c - c0

            # Work in floats: mixing raw uint8 values could wrap around.
            top_left, top_right = float(img[r0, c0]), float(img[r0, c1])
            bottom_left, bottom_right = float(img[r1, c0]), float(img[r1, c1])

            # Blend along the columns first, then between the two rows.
            top = top_left * (1.0 - dc) + top_right * dc
            bottom = bottom_left * (1.0 - dc) + bottom_right * dc
            value = top * (1.0 - dr) + bottom * dr

            # Round to nearest and clamp into the uint8 range.
            result[r, c] = min(255, max(0, int(value + 0.5)))
    return result


# Test: resize 50x50 to 150x150
# img_150_nearest  = resize_nearest(img_50, 150, 150)
# img_150_bilinear = resize_bilinear(img_50, 150, 150)
# print("150x150 shapes:", img_150_nearest.shape, img_150_bilinear.shape)

# YOUR CODE HERE: Apply and display

# Resize to 150x150
# show_images([img_50, img_150_nearest, img_150_bilinear],
#             titles=['Original 50x50', 'Nearest (150x150)', 'Bilinear (150x150)'],
#             cmap_list=['gray', 'gray', 'gray'])

# Resize to 75x75
# img_75_nearest  = resize_nearest(img_50, 75, 75)
# img_75_bilinear = resize_bilinear(img_50, 75, 75)
# show_images([img_50, img_75_nearest, img_75_bilinear],
#             titles=['Original 50x50', 'Nearest (75x75)', 'Bilinear (75x75)'],
#             cmap_list=['gray', 'gray', 'gray'])

# YOUR CODE HERE
# Take the top-left 10x10 corner of the 50x50 image as the tiny input.
patch = img_50[:10, :10]
print("Patch shape:", patch.shape)

# patch_200_nearest  = resize_nearest(patch, 200, 200)
# patch_200_bilinear = resize_bilinear(patch, 200, 200)

# show_images([patch, patch_200_nearest, patch_200_bilinear],
#             titles=['10x10 Patch', 'Nearest (200x200)', 'Bilinear (200x200)'],
#             cmap_list=['gray', 'gray', 'gray'],
#             figsize=(15, 5))

def conv(image, weights):
    """
    Applies a convolution filter to a grayscale image.

    The kernel is slid over every position where it fits completely inside
    the image ("valid" mode, no padding). At each position the overlapping
    values are multiplied element by element and summed. The kernel is not
    flipped, so an asymmetric kernel is applied exactly as written.

    Parameters:
        image   : 2D numpy array of shape (H, W)
        weights : 2D numpy array of shape (K, K) — the filter kernel

    Returns:
        output  : 2D numpy array of shape (H-K+1, W-K+1), dtype float64
                  Contains the raw convolution output (may not be in [0,255])
    """
    H, W = image.shape
    K    = weights.shape[0]  # Kernel size (assume square)

    out_H = H - K + 1
    out_W = W - K + 1

    output = np.zeros((out_H, out_W), dtype=np.float64)

    for r in range(out_H):
        for c in range(out_W):
            total = 0.0
            for i in range(K):
                for j in range(K):
                    # float() keeps integer inputs (e.g. uint8) from
                    # overflowing inside the product.
                    total += float(image[r + i, c + j]) * float(weights[i, j])
            output[r, c] = total

    return output


# SANITY CHECK: Identity filter — should return the original image (minus edges)
# Only the center weight is 1, so each output value should equal the input
# pixel under the kernel's center.
identity_kernel = np.array([
    [0, 0, 0],
    [0, 1, 0],
    [0, 0, 0]
], dtype=np.float64)

result = conv(img_100.astype(np.float64), identity_kernel)
print("Output shape:", result.shape)            # Should be (98, 98)

# Check: result[0,0] should equal img_100[1,1]
# (the 3x3 kernel placed at the top-left corner is centered on input pixel [1,1])
print(f"result[0,0] = {result[0,0]:.1f}")
print(f"img_100[1,1] = {img_100[1,1]}")
print("Match:", abs(result[0,0] - float(img_100[1,1])) < 1e-9)

# DISPLAY HELPER for convolution output — run this cell as-is
def show_conv_result(original, output, title='Convolution Output', clip=False):
    """
    Shows the input image next to a convolution result.

    The result is mapped into 0..255 for display: linearly rescaled from its
    own minimum/maximum by default, or clipped when `clip` is True. A result
    with no value range (max not greater than min) is shown as all zeros.
    The original is cropped around its center to the result's size.

    Parameters:
        original : the input image (2D array, uint8)
        output   : the convolution result (2D float array)
        title    : caption for the result panel
        clip     : if True, clip to [0,255] instead of normalizing
    """
    if clip:
        display_out = np.clip(output, 0, 255).astype(np.uint8)
    else:
        lowest, highest = output.min(), output.max()
        if highest > lowest:
            rescaled = (output - lowest) / (highest - lowest) * 255
            display_out = rescaled.astype(np.uint8)
        else:
            display_out = np.zeros_like(output, dtype=np.uint8)

    # Crop the original so both panels have the same size. The margin is
    # derived from the row difference and reused for the columns.
    out_rows, out_cols = display_out.shape[0], display_out.shape[1]
    margin = (original.shape[0] - out_rows) // 2
    orig_trimmed = original[margin:margin + out_rows, margin:margin + out_cols]

    show_images(
        [orig_trimmed, display_out],
        titles=['Original (trimmed)', title],
        cmap_list=['gray', 'gray']
    )

print("show_conv_result() helper ready.")

# Define the kernels
# Box blur: nine equal weights that sum to 1.
kernel_blur = np.array([
    [1/9, 1/9, 1/9],
    [1/9, 1/9, 1/9],
    [1/9, 1/9, 1/9]
])

# Sharpen: center weight 5 minus the four direct neighbors (weights sum to 1).
kernel_sharpen = np.array([
    [ 0, -1,  0],
    [-1,  5, -1],
    [ 0, -1,  0]
], dtype=np.float64)

# Sobel, horizontal edges: bottom row minus top row (weights sum to 0).
kernel_sobel_h = np.array([
    [-1, -2, -1],
    [ 0,  0,  0],
    [ 1,  2,  1]
], dtype=np.float64)

# Sobel, vertical edges: right column minus left column (weights sum to 0).
kernel_sobel_v = np.array([
    [-1,  0,  1],
    [-2,  0,  2],
    [-1,  0,  1]
], dtype=np.float64)


# Apply and display — YOUR CODE

# Kernel A: Blur
result_blur = conv(img_100.astype(np.float64), kernel_blur)
show_conv_result(img_100, result_blur, title='Blur')
# What do you observe? Write below.

# Kernel B: Sharpen
# result_sharpen = ???
# show_conv_result(img_100, result_sharpen, title='Sharpen')

# Kernel C: Horizontal Edges
# result_sobel_h = ???

# Kernel D: Vertical Edges
# result_sobel_v = ???

# Combine horizontal and vertical edges into edge magnitude
# edge_magnitude[r, c] = sqrt(result_sobel_h[r,c]**2 + result_sobel_v[r,c]**2)

# YOUR CODE (use a loop, use import math or ** 0.5)
# math is only needed once the edge-magnitude loop below is uncommented.
import math

# h, w = result_sobel_h.shape
# edge_magnitude = np.zeros((h, w), dtype=np.float64)
# for r in range(h):
#     for c in range(w):
#         edge_magnitude[r, c] = ???

# show_conv_result(img_100, edge_magnitude, title='Edge Magnitude (Sobel)')

# Task 1: Your own 3x3 filter
# As written this is the identity kernel (only the center weight is 1).
my_kernel = np.array([
    [0, 0, 0],
    [0, 1, 0],  # Change these!
    [0, 0, 0]
], dtype=np.float64)

# Apply and display
# result_mine = conv(img_100.astype(np.float64), my_kernel)
# show_conv_result(img_100, result_mine, title='My Filter')

# Task 2: 5x5 blur
# 25 equal weights of 1/25, so they sum to 1.
kernel_blur_5x5 = np.full((5, 5), 1/25)
# result_blur_5 = conv(img_100.astype(np.float64), kernel_blur_5x5)
# show_conv_result(img_100, result_blur_5, title='5x5 Blur')

# Task 3: Gaussian-like blur
# Design the kernel: center=4, direct neighbors=2, corners=1, normalized
# YOUR CODE
# Not normalized yet: these weights sum to 16 until the division below is done.
gaussian_approx = np.array([
    [1, 2, 1],
    [2, 4, 2],
    [1, 2, 1]
], dtype=np.float64)
# Normalize so weights sum to 1:
# gaussian_approx = gaussian_approx / ???
# result_gaussian = conv(img_100.astype(np.float64), gaussian_approx)
# show_conv_result(img_100, result_gaussian, title='Gaussian-like Blur')

# Task 4: Apply blur multiple times
# YOUR CODE
# Float copy of the input, used as the starting point for repeated blurring.
img_float = img_100.astype(np.float64)

# Apply blur once
# blurred_1 = conv(img_float, kernel_blur)

# Apply again
# blurred_2 = conv(blurred_1, kernel_blur)

# Apply 5 times using a loop
# current = img_float
# for _ in range(5):
#     current = conv(current, kernel_blur)
# blurred_5 = current

# Display original, 1x blurred, 2x blurred, 5x blurred
# show_images([img_100, ...], titles=['Original', '1x blur', '2x blur', '5x blur'], cmap_list=['gray']*4)

def pad_image(img, pad_size):
    """
    Pads a (H, W) image with `pad_size` zeros on all sides.
    Returns a (H + 2*pad_size, W + 2*pad_size) array with the same dtype as
    `img`; the original pixels sit in the center, shifted by `pad_size` rows
    and columns.

    Implement using loops — no np.pad!
    """
    H, W = img.shape
    new_H = H + 2 * pad_size
    new_W = W + 2 * pad_size
    result = np.zeros((new_H, new_W), dtype=img.dtype)
    # Copy img into the center of result; the border keeps its zeros.
    for r in range(H):
        for c in range(W):
            result[r + pad_size, c + pad_size] = img[r, c]
    return result


def conv_same(image, weights):
    """
    Convolution with 'same' padding: output is the same size as input.
    Uses pad_image internally.

    The image is surrounded by (K - 1) // 2 rows and columns of zeros and
    then passed to conv(). For an odd kernel size K this gives an output with
    the input's height and width. For an even K the padding is one short, so
    the output is one row and one column smaller than the input.

    Parameters:
        image   : 2D numpy array of shape (H, W)
        weights : 2D numpy array of shape (K, K) — the filter kernel

    Returns: whatever conv() returns for the padded image
    """
    K = weights.shape[0]
    pad_size = (K - 1) // 2
    padded = pad_image(image, pad_size)
    return conv(padded, weights)


# Test
# One pixel of padding on every side adds 2 to each dimension.
padded = pad_image(img_100, pad_size=1)
print("Padded shape:", padded.shape)  # Should be (102, 102)

# result_same = conv_same(img_100.astype(np.float64), kernel_blur)
# print("conv_same output shape:", result_same.shape)  # Should be (100, 100)

def conv_color(image_rgb, weights):
    """
    Applies conv_same independently to each color channel.

    image_rgb: (H, W, 3) uint8 array
    weights  : (K, K) kernel; conv_same must return an (H, W) result for it,
               otherwise the per-channel assignment below fails
    Returns  : (H, W, 3) float64 array holding the raw, unclipped filter
               output of each channel
    """
    H, W = image_rgb.shape[0], image_rgb.shape[1]
    result = np.zeros((H, W, 3), dtype=np.float64)

    for ch in range(3):  # ch = 0 (R), 1 (G), 2 (B)
        # Filter in float64 so negative or >255 results are kept as they are.
        channel = image_rgb[:, :, ch].astype(np.float64)
        result[:, :, ch] = conv_same(channel, weights)

    return result


# Apply blur to color image and display
# color_blurred = conv_color(color_arr, kernel_blur)

# DISPLAY HELPER for color convolution output
def show_color_conv(original, output, title='Color Convolution'):
    """
    Shows `original` next to `output` rescaled for display.

    `output` is stretched linearly from its own minimum/maximum to 0..255
    (one scale shared by the whole array) and cast to uint8. If it has no
    value range (max not greater than min) an all-zero image is shown instead.
    """
    floor, ceiling = output.min(), output.max()
    if ceiling > floor:
        stretched = (output - floor) / (ceiling - floor) * 255
        display = stretched.astype(np.uint8)
    else:
        display = np.zeros_like(output, dtype=np.uint8)
    show_images([original, display], titles=['Original', title])

# show_color_conv(color_arr, color_blurred, title='Color Blur')

# YOUR MINI PIPELINE

# Step 1: Grayscale
# step1_gray = rgb_to_gray_luminosity(color_arr)

# Step 2: Resize to 50x50
# step2_small = resize_bilinear(step1_gray, 50, 50)

# Step 3: Blur
# step3_blur = conv_same(step2_small.astype(np.float64), kernel_blur)

# Step 4: Edge detection
# step4_edges_h = conv_same(step3_blur, kernel_sobel_h)
# step4_edges_v = conv_same(step3_blur, kernel_sobel_v)
# step4_edges   = edge magnitude of h and v combined (from Exercise 7.4)

# Display all steps
# show_images(
#     [color_arr, step1_gray, step2_small, np.clip(step3_blur, 0, 255).astype(np.uint8), ...],
#     titles=['1. Color', '2. Grayscale', '3. 50x50', '4. Blurred', '5. Edges'],
#     cmap_list=[None, 'gray', 'gray', 'gray', 'gray']
# )

# Every pipeline step above is still commented out, so this cell only prints a reminder.
print("Fill in each step above!")

# YOUR DIAGONAL EDGE DETECTOR

# Think: for a '\\' edge (top-left bright, bottom-right dark),
# which pixels in a 3x3 neighborhood would be bright and which dark?
# Replace the zeros below with your values (use positive and negative numbers).

# Placeholder kernel: all weights are zero until the values are replaced, so
# applying it as-is would give an all-zero output.
kernel_diag_backslash = np.array([
    [0, 0, 0],   # <-- replace with your values
    [0, 0, 0],
    [0, 0, 0]
], dtype=np.float64)

# Hint: look at the Sobel kernels for inspiration.
# The horizontal Sobel uses +1/-1 to detect top vs. bottom.
# What values detect top-left vs. bottom-right?

# result_diag = conv_same(img_100.astype(np.float64), kernel_diag_backslash)
# show_conv_result(img_100, result_diag, title='Diagonal Edge Detector (\\\\)')

# YOUR CODE HERE

# Apply sharpen multiple times, keeping a copy after passes 1, 3, 5 and 10.
current = img_100.astype(np.float64)
snapshots = []
for i in range(10):
    current = conv_same(current, kernel_sharpen)
    if current is None:
        # conv_same() is still an unimplemented stub. Stop with a hint
        # instead of failing on current.copy() below.
        print("conv_same() returned None — finish Exercise 7.6 before running this cell.")
        break
    if i + 1 in (1, 3, 5, 10):
        snapshots.append((i + 1, current.copy()))

# Display snapshots
# images = [snap for (_, snap) in snapshots]
# titles = [f'{n}x sharpen' for (n, _) in snapshots]
# ... normalize and display

| Method | Formula |
| --- | --- |
| Average | $\frac{R + G + B}{3}$ |
| Lightness | $\frac{\max(R,G,B) + \min(R,G,B)}{2}$ |
| Luminosity (ITU-R BT.601) | $0.299 R + 0.587 G + 0.114 B$ |
| Your own idea | (whatever you came up with above) |

# Learning Convolutions by Inventing Computer Vision

## What you'll need

## PART 1: What Is an Image?

### Exercise 1.1 — Load and Look

### Exercise 1.2 — Peek Inside: Images as Numbers

### Exercise 1.3 — Navigate the Grid

### Exercise 1.4 — Visualize a Tiny Slice

## PART 2: Extracting a Color Channel

### Exercise 2.1 — What Are R, G, B?

### Exercise 2.2 — Extract the Red Channel Using Loops

### Exercise 2.3 — Visualize a Single Channel in Its True Color

## PART 3: Converting Color to Grayscale

### Exercise 3.1 — What Is Grayscale?

### Exercise 3.2 — Implement Your Formulas

### Exercise 3.3 — Compare the Methods

## PART 4: Shrinking an Image — Downsampling

### Exercise 4.1 — Set Up: Get a 100×100 Grayscale Image

### Exercise 4.2 — Think Before You Code

### Exercise 4.3 — Implement Three Downsampling Methods

### Exercise 4.4 — Compare and Analyze

## PART 5: Growing an Image — Upsampling to 100×100

### Exercise 5.1 — The Reverse Problem

### Exercise 5.2 — Implement Three Upsampling Methods

### Exercise 5.3 — Compare and Analyze

## PART 6: Upsampling to a Non-Integer Scale — 50×50 to 150×150

### Exercise 6.1 — A New Challenge

### Exercise 6.2 — Extreme Upsampling

## PART 7: Designing a Convolution

### Exercise 7.1 — The Neighborhood Idea

### Exercise 7.2 — Your First Convolution

### Exercise 7.3 — Helper for Displaying Convolution Output

### Exercise 7.4 — Discover What Filters Do

### Exercise 7.5 — Invent Your Own Filter

### Exercise 7.6 — Add Padding

### Exercise 7.7 — Convolution on a Color Image

## PART 8: Pulling It All Together

### Exercise 8.1 — Build a Mini Image Processing Pipeline

### Exercise 8.2 — Bonus: Design a Filter by Intuition

### Exercise 8.3 — Bonus: What Does Repeated Convolution Do?

## Final Reflection