import numpy as np
import matplotlib.pyplot as plt

import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

# PLOTTING HELPER — run this cell as-is, you'll use plot_function() throughout the notebook
def plot_function(f, x_range=(-3, 3), num_points=500, title="f(x)", mark_x=None):
    """
    Draw the curve of a one-variable function, optionally highlighting a point.

    Parameters:
        f          : callable taking one number and returning one number
        x_range    : pair (x_min, x_max) giving the plotted interval
        num_points : how many evenly spaced samples of f are drawn
        title      : text shown above the plot
        mark_x     : when not None, a red dot is drawn at (mark_x, f(mark_x))
                     and a legend shows both coordinates to 4 decimals
    """
    lower, upper = x_range[0], x_range[1]
    sample_xs = np.linspace(lower, upper, num_points)
    # f is called one sample at a time, so it does not need to accept arrays.
    sample_ys = list(map(f, sample_xs))

    plt.figure(figsize=(8, 4))
    plt.plot(sample_xs, sample_ys, 'b-', linewidth=2)

    if mark_x is not None:
        marked_y = f(mark_x)
        marker_label = f'x={mark_x:.4f}, f(x)={f(mark_x):.4f}'
        plt.plot(mark_x, marked_y, 'ro', markersize=10, label=marker_label)
        plt.legend()

    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('f(x)')
    plt.grid(True)
    plt.show()

# PLOTTING HELPER — run this cell as-is
def plot_function(f, x_range=(-3, 3), num_points=500, title="f(x)", mark_x=None):
    """
    Plot f over x_range, optionally marking one x value with a red dot.

    Parameters:
        f          : a Python function that takes a number and returns a number
        x_range    : tuple (x_min, x_max)
        num_points : number of evenly spaced sample points along x_range
        title      : string label for the plot
        mark_x     : if provided, draws a red dot at (mark_x, f(mark_x)) and
                     shows both coordinates in the legend
    """
    xs = np.linspace(x_range[0], x_range[1], num_points)
    # Evaluate point by point so f does not have to support NumPy arrays.
    ys = [f(x) for x in xs]
    plt.figure(figsize=(8, 4))
    plt.plot(xs, ys, 'b-', linewidth=2)
    if mark_x is not None:
        # Evaluate once so the dot and its label always show the same value.
        mark_y = f(mark_x)
        plt.plot(mark_x, mark_y, 'ro', markersize=10,
                 label=f'x={mark_x:.4f}, f(x)={mark_y:.4f}')
        plt.legend()
    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('f(x)')
    plt.grid(True)
    plt.show()

# YOUR CODE HERE
# Step 1: Define f(x) = x^4 - 4x + 10
def f(x):
    """Return f(x) = x^4 - 4x + 10, the curve minimized in Parts 1 and 2."""
    return x**4 - 4*x + 10

# Step 2: Plot it
# plot_function(...)

# Step 3: Write your visual estimate of the minimum below
# My guess: x ≈ ???

# Template for recording your guesses:
guesses = [
    # (x_value, f(x_value))
    # e.g. (1.0, f(1.0)),
]

# YOUR CODE HERE — try different values of mark_x
plot_function(f, mark_x=1.0, title="My guess: x=1.0")

# Record all your guesses here
# NOTE: this rebinds `guesses`, so anything stored in the template list above is discarded.
guesses = [
    # (x_value, f(x_value))
]

# Print them nicely
# Header row; the column widths (10, 15, 15) match the row format in the loop below.
print(f"{'Guess #':<10} {'x':<15} {'f(x)':<15}")
print("-" * 40)
# Guesses are numbered from 1 in the output; with an empty list only the header is printed.
for i, (x, fx) in enumerate(guesses):
    print(f"{i+1:<10} {x:<15.6f} {fx:<15.6f}")

# YOUR CODE HERE
def numerical_derivative(f, x, h=1e-5):
    """
    Returns the approximate derivative of f at point x.

    Uses the central difference (f(x + h) - f(x - h)) / (2h), whose
    truncation error shrinks with h**2, versus h for a one-sided difference.

    Parameters:
        f : function of one number returning one number
        x : point at which the slope is estimated
        h : half-width of the sampling interval around x

    Returns:
        slope : approximate value of f'(x)
    """
    return (f(x + h) - f(x - h)) / (2 * h)


# Test it
test_points = [0, 1, 1.5, 2]
# NOTE: this loop reuses the global name `x`; it is reset to 2.0 further down.
for x in test_points:
    slope = numerical_derivative(f, x)
    # print x, slope, and direction

# YOUR CODE HERE
alpha = 0.01  # step-size multiplier applied to the slope in the update rule below
x = 2.0       # starting point of the manual descent

# Header row; the column widths match the per-step row format in the loop.
print(f"{'Step':<8} {'x':<15} {'f(x)':<15} {'slope':<15}")
print("-" * 55)

# Five hand-rolled descent steps: each row shows the state BEFORE that step's update.
for step in range(5):
    slope = numerical_derivative(f, x)
    print(f"{step:<8} {x:<15.6f} {f(x):<15.6f} {slope:<15.6f}")
    x = x - alpha * slope  # the update rule

def find_minima_1d(f, x_start, alpha=0.01, epsilon=1e-6, max_steps=10000):
    """
    Finds the x that minimizes f using gradient descent.

    NOTE: this is the specification stub. Its body is only `pass`, so calling
    it returns None. The name is defined again further down in this file, and
    that later definition is the one in effect after the file has run.

    Parameters:
        f         : function to minimize
        x_start   : starting point
        alpha     : learning rate
        epsilon   : stop when |slope| < epsilon
        max_steps : maximum number of steps

    Returns:
        x_min     : the x value at the minimum
        f_min     : the function value at the minimum
        history   : list of (step, x, f(x)) tuples
    """
    pass  # YOUR IMPLEMENTATION

# YOUR CODE HERE
def find_minima_1d(f, x_start, alpha=0.01, epsilon=1e-6, max_steps=10000):
    """
    Finds the x that minimizes f using gradient descent.

    The slope is estimated with a central difference, so f only needs to be
    callable on plain numbers.

    Parameters:
        f         : function to minimize
        x_start   : starting point
        alpha     : learning rate
        epsilon   : stop when |slope| < epsilon
        max_steps : maximum number of update steps

    Returns:
        x_min     : the x value where the descent stopped
        f_min     : f(x_min)
        history   : list of (step, x, f(x)) tuples; entry 0 is the starting
                    point and the last entry is (.., x_min, f_min)

    If the iteration diverges (f overflows or stops being finite), the
    descent stops and the last finite point is returned.
    """
    h = 1e-5  # half-width used for the central-difference slope estimate
    x = x_start
    f_val = f(x)
    history = [(0, x, f_val)]

    for step in range(1, max_steps + 1):
        try:
            slope = (f(x + h) - f(x - h)) / (2 * h)
            if abs(slope) < epsilon:
                break  # flat enough: treat as converged
            x_next = x - alpha * slope
            f_next = f(x_next)
        except OverflowError:
            break  # diverged: values are no longer representable
        if not np.isfinite(f_next):
            break  # diverged to inf/nan: keep the last finite point
        x, f_val = x_next, f_next
        history.append((step, x, f_val))

    return x, f_val, history


# Test it
# Unpacks the (x_min, f_min, history) triple described in the find_minima_1d docstring.
x_min, f_min, history = find_minima_1d(f, x_start=2.0)
print(f"Minimum found at x = {x_min:.6f}")
print(f"f(x_min) = {f_min:.6f}")
# Reports the number of entries recorded in history.
print(f"Steps taken: {len(history)}")

# PLOTTING HELPER — descent path
def plot_descent(f, history, x_range=(-3, 3), title="Gradient Descent"):
    """
    Show a 1D descent run as two side-by-side panels.

    Left panel: the curve of f over x_range with the visited points overlaid
    and the last visited point starred. Right panel: f(x) against step number.

    history: list of (step, x, f(x)) tuples
    """
    curve_x = np.linspace(x_range[0], x_range[1], 500)
    curve_y = list(map(f, curve_x))

    # Transpose the list of tuples into three parallel sequences.
    steps, xvals, fvals = zip(*history)
    last_x = xvals[-1]
    last_f = fvals[-1]

    plt.figure(figsize=(12, 4))

    # Left: function with descent path
    plt.subplot(1, 2, 1)
    plt.plot(curve_x, curve_y, 'b-', linewidth=2, label='f(x)')
    plt.plot(xvals, fvals, 'ro-', markersize=3, alpha=0.5, label='descent path')
    plt.plot(last_x, last_f, 'g*', markersize=15, label=f'minimum: x={last_x:.4f}')
    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('f(x)')
    plt.legend()
    plt.grid(True)

    # Right: f(x) over steps
    plt.subplot(1, 2, 2)
    plt.plot(steps, fvals, 'b-')
    plt.title('f(x) value over steps')
    plt.xlabel('step')
    plt.ylabel('f(x)')
    plt.grid(True)

    plt.tight_layout()
    plt.show()

# PLOTTING HELPER — run this cell as-is
def plot_descent(f, history, x_range=(-3, 3), title="Gradient Descent"):
    """
    Plot f together with the path a 1D gradient descent took.

    Parameters:
        f       : function of one number that was minimized
        history : list of (step, x, f(x)) tuples recorded during descent
        x_range : (x_min, x_max) interval over which f is drawn
        title   : title of the left-hand panel
    """
    start, stop = x_range[0], x_range[1]
    grid = np.linspace(start, stop, 500)
    values = []
    for point in grid:
        values.append(f(point))

    steps, xvals, fvals = zip(*history)
    end_label = f'minimum: x={xvals[-1]:.4f}'

    plt.figure(figsize=(12, 4))

    # Panel 1: the curve, the visited points, and the final point as a star.
    plt.subplot(1, 2, 1)
    plt.plot(grid, values, 'b-', linewidth=2, label='f(x)')
    plt.plot(xvals, fvals, 'ro-', markersize=3, alpha=0.5, label='descent path')
    plt.plot(xvals[-1], fvals[-1], 'g*', markersize=15, label=end_label)
    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('f(x)')
    plt.legend()
    plt.grid(True)

    # Panel 2: how the function value changed from step to step.
    plt.subplot(1, 2, 2)
    plt.plot(steps, fvals, 'b-')
    plt.title('f(x) over steps')
    plt.xlabel('step')
    plt.ylabel('f(x)')
    plt.grid(True)

    plt.tight_layout()
    plt.show()

# YOUR CODE HERE
# Experiment 1: Default settings
# Runs the descent with every optional argument left at its default, then plots the recorded path.
x_min, f_min, history = find_minima_1d(f, x_start=2.0)
plot_descent(f, history)

# Experiment 2: Different starting point
# ...

# Experiment 3: Different learning rates
# ...

# Function A
def fA(x):
    """Return fA(x) = x^6 - 4x^2 + 10."""
    sextic_term = x**6
    quadratic_term = 4*x**2
    return sextic_term - quadratic_term + 10

# Draw fA over the interval (-2, 2).
plot_function(fA, x_range=(-2, 2), title="fA: x^6 - 4x^2 + 10")

# YOUR CODE: run find_minima_1d and plot_descent
# What do you notice? Are there multiple minima?

# Function B — YOUR CODE
def fB(x):
    """Return fB(x) = (x - 3)^2 + 5 (Function B in the exercise table)."""
    return (x - 3)**2 + 5

# plot, find_minima_1d, plot_descent

# Function C — YOUR CODE
def fC(x):
    """Return fC(x) = x^2 + 3|x| (Function C in the exercise table).

    The |x| term puts a kink at x = 0, so the slope does not go to zero there.
    """
    return x**2 + 3*abs(x)

# plot, find_minima_1d, plot_descent

# Function D — YOUR CODE
def fD(x):
    """Return fD(x) = e^x - 5x (Function D in the exercise table)."""
    return np.exp(x) - 5*x

# plot, find_minima_1d, plot_descent

# Function E — YOUR CODE
def fE(x):
    """Return fE(x) = x^4 - 3x^3 + 2 (Function E in the exercise table)."""
    return x**4 - 3*x**3 + 2

# plot, find_minima_1d, plot_descent

# YOUR CODE HERE
# Run the same descent on fA from three different starting points and print where each one ends.
for x_start in [1.5, -1.5, 0.0]:
    x_min, f_min, history = find_minima_1d(fA, x_start=x_start, alpha=0.01)
    print(f"Start: x={x_start:.1f}  →  Minimum at x={x_min:.6f}, f(x)={f_min:.6f}")

# PLOTTING HELPER — 2D contour plot
def plot_function_2d(f2, x_range=(-3, 3), y_range=(-3, 3), num_points=100, title="f(x,y)", mark_xy=None):
    """
    Draw a filled contour map of a two-variable function.

    Parameters:
        f2         : callable taking (x, y) and returning a scalar
        x_range    : (x_min, x_max) extent of the horizontal axis
        y_range    : (y_min, y_max) extent of the vertical axis
        num_points : samples per axis (the grid is num_points x num_points)
        title      : text shown above the plot
        mark_xy    : optional (x, y); when given, a red star is drawn there
                     and its coordinates appear in the legend
    """
    x_axis = np.linspace(x_range[0], x_range[1], num_points)
    y_axis = np.linspace(y_range[0], y_range[1], num_points)
    X, Y = np.meshgrid(x_axis, y_axis)

    # One row per y value, one column per x value, matching meshgrid's layout.
    rows = []
    for y_val in y_axis:
        rows.append([f2(x_val, y_val) for x_val in x_axis])
    Z = np.array(rows)

    plt.figure(figsize=(6, 5))
    filled = plt.contourf(X, Y, Z, levels=30, cmap='viridis')
    plt.colorbar(filled)

    if mark_xy is not None:
        star_label = f'({mark_xy[0]:.3f}, {mark_xy[1]:.3f})'
        plt.plot(mark_xy[0], mark_xy[1], 'r*', markersize=15, label=star_label)
        plt.legend()

    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('y')
    plt.show()

# PLOTTING HELPER — run this cell as-is
def plot_function_2d(f2, x_range=(-3, 3), y_range=(-3, 3), num_points=100, title="f(x,y)", mark_xy=None):
    """
    Plot f2(x, y) as a filled contour map over x_range by y_range.

    f2 is called once per grid point with scalar arguments. If mark_xy is
    given as (x, y), that point is highlighted with a red star and a legend.
    """
    col_values = np.linspace(x_range[0], x_range[1], num_points)
    row_values = np.linspace(y_range[0], y_range[1], num_points)
    X, Y = np.meshgrid(col_values, row_values)
    # Outer index walks y (rows) and inner index walks x (columns).
    heights = np.array([[f2(cx, ry) for cx in col_values] for ry in row_values])

    plt.figure(figsize=(6, 5))
    contour_set = plt.contourf(X, Y, heights, levels=30, cmap='viridis')
    plt.colorbar(contour_set)

    if mark_xy is not None:
        plt.plot(
            mark_xy[0],
            mark_xy[1],
            'r*',
            markersize=15,
            label=f'({mark_xy[0]:.3f}, {mark_xy[1]:.3f})',
        )
        plt.legend()

    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('y')
    plt.show()

# YOUR CODE HERE
def g(x, y):
    """Return g(x, y) = x^2 + y^2."""
    x_squared = x**2
    y_squared = y**2
    return x_squared + y_squared

# Contour map of g over the helper's default ranges.
plot_function_2d(g, title="g(x,y) = x^2 + y^2")

# Now define and plot h1, h2, h3
# ...

# YOUR CODE HERE
def partial_x(f2, x, y, h=1e-5):
    """
    Approximate the partial derivative of f2 with respect to x at (x, y).

    Uses a central difference in x while y is held fixed.
    """
    return (f2(x + h, y) - f2(x - h, y)) / (2 * h)

def partial_y(f2, x, y, h=1e-5):
    """
    Approximate the partial derivative of f2 with respect to y at (x, y).

    Uses a central difference in y while x is held fixed.
    """
    return (f2(x, y + h) - f2(x, y - h)) / (2 * h)

def gradient_2d(f2, x, y, h=1e-5):
    """
    Approximate the gradient of f2 at (x, y).

    Parameters:
        f2 : function that takes (x, y) and returns a scalar
        x  : x coordinate of the evaluation point
        y  : y coordinate of the evaluation point
        h  : half-width of the finite-difference interval

    Returns:
        (df/dx, df/dy) as a tuple of two numbers
    """
    return (partial_x(f2, x, y, h), partial_y(f2, x, y, h))


# Test on g(x,y) = x^2 + y^2
# NOTE: rebinds the global `test_points` (previously a list of 1D points) and the loop rebinds x and y.
test_points = [(1, 1), (3, 0), (0, 0)]
for (x, y) in test_points:
    grad = gradient_2d(g, x, y)
    print(f"Gradient at ({x}, {y}) = {grad}")

# YOUR CODE HERE
def find_minima_2d(f2, x_start, y_start, alpha=0.1, epsilon=1e-6, max_steps=10000):
    """
    Finds the (x, y) that minimizes f2 using gradient descent.

    Both partial derivatives are estimated with central differences, so f2
    only needs to be callable on plain numbers.

    Parameters:
        f2        : function that takes (x, y) and returns a scalar
        x_start   : starting x coordinate
        y_start   : starting y coordinate
        alpha     : learning rate
        epsilon   : stop when the gradient magnitude is below epsilon
        max_steps : maximum number of update steps

    Returns:
        x_min     : x coordinate where the descent stopped
        y_min     : y coordinate where the descent stopped
        f_min     : f2(x_min, y_min)
        history   : list of (step, x, y, f(x,y)) tuples; entry 0 is the
                    starting point and the last entry is the returned point

    If the iteration diverges (f2 overflows or stops being finite), the
    descent stops and the last finite point is returned.
    """
    h = 1e-5  # half-width used for the central-difference estimates
    x, y = x_start, y_start
    f_val = f2(x, y)
    history = [(0, x, y, f_val)]

    for step in range(1, max_steps + 1):
        try:
            grad_x = (f2(x + h, y) - f2(x - h, y)) / (2 * h)
            grad_y = (f2(x, y + h) - f2(x, y - h)) / (2 * h)
            if (grad_x * grad_x + grad_y * grad_y) ** 0.5 < epsilon:
                break  # flat enough: treat as converged
            x_next = x - alpha * grad_x
            y_next = y - alpha * grad_y
            f_next = f2(x_next, y_next)
        except OverflowError:
            break  # diverged: values are no longer representable
        if not np.isfinite(f_next):
            break  # diverged to inf/nan: keep the last finite point
        x, y, f_val = x_next, y_next, f_next
        history.append((step, x, y, f_val))

    return x, y, f_val, history


# Test on g
# Expects find_minima_2d to return a 4-tuple: final x, final y, final function value, and a history list.
x_min, y_min, f_min, history = find_minima_2d(g, x_start=2.0, y_start=3.0)
print(f"g: minimum at ({x_min:.4f}, {y_min:.4f}), f={f_min:.6f}, steps={len(history)}")
# Mark the returned point on the contour map of g.
plot_function_2d(g, mark_xy=(x_min, y_min), title="g: descent result")

# Test on h1
def h1(x, y):
    """Return h1(x, y) = (x - 1)^2 + (y + 2)^2."""
    x_offset = x - 1
    y_offset = y + 2
    return x_offset**2 + y_offset**2

# YOUR CODE: run find_minima_2d and verify

# Test on h2
def h2(x, y):
    """Return h2(x, y) = x^2 + 4y^2."""
    x_part = x**2
    y_part = 4*y**2
    return x_part + y_part

# YOUR CODE: run find_minima_2d and verify
# Try alpha=0.1. Does it converge? Try alpha=0.3. What happens?

# PLOTTING HELPER — 2D descent path
def plot_descent_2d(f2, history, x_range=(-4, 4), y_range=(-4, 4), title="2D Gradient Descent"):
    """
    Show a 2D descent run as two side-by-side panels.

    Left panel: filled contour map of f2 with the visited points drawn on top
    (red square = first point, green star = last point). Right panel: the
    function value against step number.

    history: list of (step, x, y, f(x,y)) tuples
    """
    x_axis = np.linspace(x_range[0], x_range[1], 100)
    y_axis = np.linspace(y_range[0], y_range[1], 100)
    X, Y = np.meshgrid(x_axis, y_axis)

    # One row per y value, one column per x value, matching meshgrid's layout.
    rows = []
    for y_val in y_axis:
        rows.append([f2(x_val, y_val) for x_val in x_axis])
    Z = np.array(rows)

    # Transpose the list of tuples into four parallel sequences.
    steps, xvals, yvals, fvals = zip(*history)
    first_x, first_y = xvals[0], yvals[0]
    last_x, last_y = xvals[-1], yvals[-1]

    plt.figure(figsize=(12, 5))

    plt.subplot(1, 2, 1)
    plt.contourf(X, Y, Z, levels=30, cmap='viridis')
    plt.colorbar()
    plt.plot(xvals, yvals, 'w-o', markersize=3, alpha=0.6, label='path')
    plt.plot(first_x, first_y, 'rs', markersize=10, label='start')
    plt.plot(last_x, last_y, 'g*', markersize=15, label='end')
    plt.legend()
    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('y')

    plt.subplot(1, 2, 2)
    plt.plot(steps, fvals, 'b-')
    plt.title('f(x,y) over steps')
    plt.xlabel('step')
    plt.ylabel('f(x,y)')
    plt.grid(True)

    plt.tight_layout()
    plt.show()

# PLOTTING HELPER — run this cell as-is
def plot_descent_2d(f2, history, x_range=(-4, 4), y_range=(-4, 4), title="2D Gradient Descent"):
    """
    Plot the contour map of f2 with a descent path on top, plus f over steps.

    Parameters:
        f2      : function that takes (x, y) and returns a scalar
        history : list of (step, x, y, f(x,y)) tuples recorded during descent
        x_range : (x_min, x_max) extent of the contour map
        y_range : (y_min, y_max) extent of the contour map
        title   : title of the contour panel
    """
    col_values = np.linspace(x_range[0], x_range[1], 100)
    row_values = np.linspace(y_range[0], y_range[1], 100)
    X, Y = np.meshgrid(col_values, row_values)
    # Outer index walks y (rows) and inner index walks x (columns).
    heights = np.array([[f2(cx, ry) for cx in col_values] for ry in row_values])

    steps, xvals, yvals, fvals = zip(*history)

    plt.figure(figsize=(12, 5))

    # Panel 1: landscape with the path; square marks the start, star the end.
    plt.subplot(1, 2, 1)
    plt.contourf(X, Y, heights, levels=30, cmap='viridis')
    plt.colorbar()
    plt.plot(xvals, yvals, 'w-o', markersize=3, alpha=0.6, label='path')
    plt.plot(xvals[0], yvals[0], 'rs', markersize=10, label='start')
    plt.plot(xvals[-1], yvals[-1], 'g*', markersize=15, label='end')
    plt.legend()
    plt.title(title)
    plt.xlabel('x')
    plt.ylabel('y')

    # Panel 2: function value recorded at each step.
    plt.subplot(1, 2, 2)
    plt.plot(steps, fvals, 'b-')
    plt.title('f(x,y) over steps')
    plt.xlabel('step')
    plt.ylabel('f(x,y)')
    plt.grid(True)

    plt.tight_layout()
    plt.show()

# YOUR CODE HERE
# Run descent on h2 with different alphas and visualize

def find_minima(f, variables, alpha=0.01, epsilon=1e-6, max_steps=100000):
    """
    Finds the values of 'variables' that minimize f.

    NOTE: this is the specification stub. Its body is only `pass`, so calling
    it returns None. The name is defined again further down in this file, and
    that later definition is the one in effect after the file has run.

    Parameters:
        f         : a function that takes a LIST of values and returns a scalar
                    e.g., if variables = [x, y], then f([x, y]) should work
        variables : initial guess, a list of numbers [v1, v2, ..., vN]
        alpha     : learning rate
        epsilon   : stop when gradient magnitude < epsilon
        max_steps : maximum number of steps

    Returns:
        min_vars  : list of variable values at the minimum
        f_min     : function value at the minimum
        history   : list of (step, variables_copy, f_value) tuples
    """
    pass

# YOUR CODE HERE
def compute_gradient(f, variables, h=1e-5):
    """
    Computes numerical gradient of f at 'variables'.

    Each partial derivative is a central difference: one coordinate is
    nudged by +h and -h on copies of the list while the others stay fixed.
    The caller's list is never modified.

    variables: list of N numbers
    Returns: list of N partial derivatives
    """
    gradient = []
    for index, _ in enumerate(variables):
        forward = list(variables)
        backward = list(variables)
        forward[index] += h
        backward[index] -= h
        gradient.append((f(forward) - f(backward)) / (2 * h))
    return gradient


def find_minima(f, variables, alpha=0.01, epsilon=1e-6, max_steps=100000):
    """
    Finds the values of 'variables' that minimize f using gradient descent.

    Parameters:
        f         : a function that takes a LIST of values and returns a scalar
        variables : initial guess, a list of numbers [v1, v2, ..., vN]
                    (copied on entry; the caller's list is not modified)
        alpha     : learning rate
        epsilon   : stop when gradient magnitude < epsilon
        max_steps : maximum number of update steps

    Returns:
        min_vars  : list of variable values where the descent stopped
        f_min     : f(min_vars)
        history   : list of (step, variables_copy, f_value) tuples; entry 0
                    is the starting point and the last entry is the result

    If the iteration diverges (f overflows or stops being finite), the
    descent stops and the last finite point is returned.
    """
    current = [float(v) for v in variables]
    f_val = f(current)
    # Store copies so later updates cannot alter recorded entries.
    history = [(0, list(current), f_val)]

    for step in range(1, max_steps + 1):
        try:
            gradient = compute_gradient(f, current)
            magnitude = sum(g * g for g in gradient) ** 0.5
            if magnitude < epsilon:
                break  # flat enough: treat as converged
            candidate = [v - alpha * g for v, g in zip(current, gradient)]
            f_candidate = f(candidate)
        except OverflowError:
            break  # diverged: values are no longer representable
        if not np.isfinite(f_candidate):
            break  # diverged to inf/nan: keep the last finite point
        current, f_val = candidate, f_candidate
        history.append((step, list(current), f_val))

    return current, f_val, history


# Test 1D
# The lambda adapts the 1D function x^4 - 4x + 10 to the list-based interface (v[0] plays the role of x).
min_vars, f_min, history = find_minima(lambda v: v[0]**4 - 4*v[0] + 10, [2.0])
print(f"1D minimum: x = {min_vars[0]:.6f}, f = {f_min:.6f}")

# Test 2D
# Same optimizer on x^2 + y^2, with v[0] as x and v[1] as y.
min_vars, f_min, history = find_minima(lambda v: v[0]**2 + v[1]**2, [2.0, 3.0])
print(f"2D minimum: x = {min_vars[0]:.6f}, y = {min_vars[1]:.6f}, f = {f_min:.6f}")

# YOUR CODE HERE
def p(v):
    """Return (x - 1)^2 + (y - 2)^2 + (z + 3)^2 for v = [x, y, z]."""
    x, y, z = v
    dx = x - 1
    dy = y - 2
    dz = z + 3
    return dx**2 + dy**2 + dz**2

def q(v):
    """Return x^2 + 2y^2 + 3z^2 - 4x + 6z for v = [x, y, z]."""
    x, y, z = v
    quadratic_part = x**2 + 2*y**2 + 3*z**2
    return quadratic_part - 4*x + 6*z

# Run find_minima on p
# Start the three-variable descent on p from the origin.
min_vars, f_min, history = find_minima(p, [0.0, 0.0, 0.0])
print(f"p minimum: {min_vars}, f = {f_min:.6f}")

# Run find_minima on q
# YOUR CODE

# What is the analytical answer for q?

# DATA — run this cell as-is
# Fix NumPy's global random seed so the noise below is the same on every run.
np.random.seed(42)
X_data = np.linspace(0, 10, 30)  # 30 evenly spaced inputs from 0 to 10
y_data = 2.5 * X_data + 4.0 + np.random.randn(30) * 3  # true line: m=2.5, c=4.0 + noise

print(f"Number of data points: {len(X_data)}")
print(f"X range: [{X_data.min():.1f}, {X_data.max():.1f}]")
print(f"y range: [{y_data.min():.1f}, {y_data.max():.1f}]")

# PLOTTING HELPER — data + line overlay
def plot_data_and_line(X, y, m=None, c=None, title="Data"):
    """
    Scatter-plot the data and, when both m and c are supplied, overlay y = mx + c.

    Parameters:
        X     : array of input values; its .min() and .max() set the line's extent
        y     : array of output values, plotted against X
        m     : slope of the overlay line (the line is skipped if None)
        c     : intercept of the overlay line (the line is skipped if None)
        title : text shown above the plot
    """
    plt.figure(figsize=(8, 5))
    plt.scatter(X, y, color='blue', label='data', zorder=5)

    have_line = not (m is None or c is None)
    if have_line:
        line_x = np.linspace(X.min(), X.max(), 200)
        line_y = m * line_x + c
        line_label = f'y = {m:.2f}x + {c:.2f}'
        plt.plot(line_x, line_y, 'r-', linewidth=2, label=line_label)

    plt.legend()
    plt.title(title)
    plt.xlabel('X')
    plt.ylabel('y')
    plt.grid(True)
    plt.show()

# YOUR CODE HERE
# 1. Plot just the data
# No m/c given, so only the scatter points are drawn.
plot_data_and_line(X_data, y_data, title="Raw Data")

# 2. Try some lines — which looks best?
# Overlays the candidate line y = 1.0x + 5.0 on the data.
plot_data_and_line(X_data, y_data, m=1.0, c=5.0, title="m=1.0, c=5.0")
# try more...

def mse(X, y, m, c):
    """
    Computes Mean Squared Error for predicting y from X using line y = mx + c.

    NOTE: this is the specification stub. Its body is only `pass`, so calling
    it returns None. The name is defined again further down in this file, and
    that later definition is the one in effect after the file has run.

    Parameters:
        X : array of input values (shape: N,)
        y : array of true output values (shape: N,)
        m : slope of the line
        c : intercept of the line

    Returns:
        mse_value : a single number
    """
    pass

# YOUR CODE HERE
def mse(X, y, m, c):
    """
    Computes Mean Squared Error for predicting y from X using line y = mx + c.

    Parameters:
        X : array of input values (shape: N,); lists are accepted too
        y : array of true output values (shape: N,); lists are accepted too
        m : slope of the line
        c : intercept of the line

    Returns:
        mse_value : mean of (y - (m*X + c))**2 over all points, as a float
    """
    inputs = np.asarray(X, dtype=float)
    targets = np.asarray(y, dtype=float)
    residuals = targets - (m * inputs + c)
    return float(np.mean(residuals**2))


# Sanity check
# These three points lie exactly on y = 2x + 1, so that line should give zero error.
X_tiny = np.array([1.0, 2.0, 3.0])
y_tiny = np.array([3.0, 5.0, 7.0])
print(f"MSE for perfect line (should be 0): {mse(X_tiny, y_tiny, 2.0, 1.0):.6f}")

# Compare on main dataset
# Each entry is (slope, intercept, label).
lines_to_test = [
    (2.5, 4.0, "true line"),
    (1.0, 5.0, "guess 1"),
    (5.0, 0.0, "guess 2"),
]
# NOTE: this loop rebinds the global names m and c.
for m, c, label in lines_to_test:
    error = mse(X_data, y_data, m, c)
    print(f"{label:15s}: m={m}, c={c}  →  MSE={error:.4f}")

def mse_landscape(m, c):
    """Return the MSE of the line y = mx + c on the global X_data / y_data."""
    error = mse(X_data, y_data, m, c)
    return error

# The contour map's horizontal axis is the slope m (0 to 5) and its vertical axis is the intercept c (-5 to 15).
plot_function_2d(mse_landscape, x_range=(0, 5), y_range=(-5, 15), title="MSE Landscape (m, c)")

# YOUR CODE HERE
def mse_landscape(m, c):
    """Evaluate the MSE surface at slope m and intercept c for the main dataset."""
    slope, intercept = m, c
    return mse(X_data, y_data, slope, intercept)

# Same landscape, with a star at (m, c) = (2.5, 4.0), the line used to generate the data.
plot_function_2d(mse_landscape, x_range=(0, 5), y_range=(-5, 15),
                 title="MSE Landscape",
                 mark_xy=(2.5, 4.0))

def mse_for_optimizer(params):
    """Adapt mse to the list-based optimizer interface: params is [m, c]."""
    slope, intercept = params
    return mse(X_data, y_data, slope, intercept)

# YOUR CODE HERE
def mse_for_optimizer(params):
    """Return the MSE on the main dataset for params = [m, c]."""
    m, c = params
    error = mse(X_data, y_data, m, c)
    return error


# Run the optimizer — tune alpha if needed
# Start from m = 0, c = 0 and let the generic optimizer minimize the MSE.
min_params, f_min, history = find_minima(mse_for_optimizer, [0.0, 0.0], alpha=0.001)

m_found, c_found = min_params
print(f"Found:  m = {m_found:.4f},  c = {c_found:.4f}")
# The generating line from the data cell; the fitted values need not match it exactly because of the added noise.
print(f"True:   m = 2.5000,  c = 4.0000")
print(f"MSE at found values: {mse(X_data, y_data, m_found, c_found):.4f}")

# Plot the result
plot_data_and_line(X_data, y_data, m=m_found, c=c_found, title=f"Best fit: m={m_found:.2f}, c={c_found:.2f}")

# PLOTTING HELPER — animated learning
def plot_learning_progress(X, y, history, steps_to_show=(0, 5, 20, 100, 500, -1)):
    """
    Shows the fitted line at different stages of training.

    Parameters:
        X             : array of input values; its .min()/.max() set the line extent
        y             : array of output values, plotted against X
        history       : list of (step, [m, c], mse_value) tuples from find_minima
        steps_to_show : indices into history, one subplot each. -1 means the
                        last entry; indices past the end are clamped to the
                        last entry.

    Raises:
        ValueError : if history is empty (there is nothing to draw)
    """
    if not history:
        raise ValueError("history is empty: nothing to plot")

    n = len(steps_to_show)
    # squeeze=False always returns a 2D array of axes, so a single-panel
    # request (n == 1) can be iterated just like the multi-panel case.
    fig, axes = plt.subplots(1, n, figsize=(4*n, 4), squeeze=False)

    last_index = len(history) - 1
    x_line = np.linspace(X.min(), X.max(), 100)

    for ax, step_idx in zip(axes[0], steps_to_show):
        if step_idx == -1:
            step_idx = last_index
        step_idx = min(step_idx, last_index)

        step_num, params, mse_val = history[step_idx]
        m, c = params
        y_line = m * x_line + c

        ax.scatter(X, y, color='blue', s=15, alpha=0.6)
        ax.plot(x_line, y_line, 'r-', linewidth=2)
        ax.set_title(f'Step {step_num}\nm={m:.2f}, c={c:.2f}\nMSE={mse_val:.1f}')
        ax.set_xlabel('X')
        ax.set_ylabel('y')
        ax.grid(True)

    plt.tight_layout()
    plt.show()

# PLOTTING HELPER — run this cell as-is
def plot_learning_progress(X, y, history, steps_to_show=(0, 5, 20, 100, 500, -1)):
    """
    Draw one subplot per requested training step, each showing the data and
    the line fitted at that step.

    Parameters:
        X             : array of input values; its .min()/.max() set the line extent
        y             : array of output values, plotted against X
        history       : list of (step, [m, c], mse_value) tuples from find_minima
        steps_to_show : indices into history. -1 selects the last entry and
                        indices beyond the end are clamped to the last entry.

    Raises:
        ValueError : if history is empty
    """
    if not history:
        raise ValueError("history is empty: nothing to plot")

    panel_count = len(steps_to_show)
    # Without squeeze=False, plt.subplots(1, 1) returns a bare Axes object
    # that cannot be zipped; the 2D array form works for any panel count.
    fig, axes = plt.subplots(1, panel_count, figsize=(4*panel_count, 4), squeeze=False)
    final_index = len(history) - 1
    x_line = np.linspace(X.min(), X.max(), 100)

    for ax, requested in zip(axes.ravel(), steps_to_show):
        chosen = final_index if requested == -1 else min(requested, final_index)
        step_num, params, mse_val = history[chosen]
        m, c = params
        ax.scatter(X, y, color='blue', s=15, alpha=0.6)
        ax.plot(x_line, m * x_line + c, 'r-', linewidth=2)
        ax.set_title(f'Step {step_num}\nm={m:.2f}, c={c:.2f}\nMSE={mse_val:.1f}')
        ax.set_xlabel('X')
        ax.set_ylabel('y')
        ax.grid(True)

    plt.tight_layout()
    plt.show()

# YOUR CODE HERE
# Re-run the fit to obtain a fresh history for the progress plot.
min_params, f_min, history = find_minima(mse_for_optimizer, [0.0, 0.0], alpha=0.001)

# Visualize the learning process
# Each listed index into history becomes one subplot; -1 selects the final entry.
plot_learning_progress(X_data, y_data, history, steps_to_show=[0, 5, 20, 100, 500, -1])

# DATASETS — run this cell as-is
# Re-seed NumPy's global generator so the three datasets are reproducible.
np.random.seed(7)

# Dataset 1: negative slope
X1 = np.linspace(0, 10, 40)
y1 = -1.5 * X1 + 20 + np.random.randn(40) * 2  # generating line: m=-1.5, c=20, plus noise

# Dataset 2: steep positive slope
X2 = np.linspace(-5, 5, 50)
y2 = 5.0 * X2 - 10 + np.random.randn(50) * 4  # generating line: m=5.0, c=-10, plus noise

# Dataset 3: nearly flat
X3 = np.linspace(0, 20, 60)
y3 = 0.3 * X3 + 2.0 + np.random.randn(60) * 5  # generating line: m=0.3, c=2.0, plus noise

print("Datasets ready: X1/y1, X2/y2, X3/y3")

# YOUR CODE HERE — Dataset 1
# Scatter plot only: no m/c passed, so no line is overlaid.
plot_data_and_line(X1, y1, title="Dataset 1 — Raw")

def mse_d1(params):
    """Return the MSE on Dataset 1 (X1, y1) for params = [m, c]."""
    slope, intercept = params
    return mse(X1, y1, slope, intercept)

# find_minima and plot result

# YOUR CODE HERE — Dataset 2

# YOUR CODE HERE — Dataset 3

# YOUR CODE HERE
# Degree-1 least-squares fit; polyfit returns coefficients highest power first, i.e. (slope, intercept).
m_np, c_np = np.polyfit(X_data, y_data, 1)
print(f"NumPy:          m = {m_np:.4f},  c = {c_np:.4f}")

# Compare with gradient descent result from Exercise 7.1
# Relies on m_found and c_found still being defined from the earlier fitting cell.
print(f"Gradient Desc:  m = {m_found:.4f},  c = {c_found:.4f}")

# Repeat for other datasets
# ...

# Quadratic data: y = 1.5x^2 - 2x + 1 plus noise.
X_quad = np.linspace(-3, 3, 50)
y_quad = 1.5 * X_quad**2 - 2 * X_quad + 1 + np.random.randn(50) * 1.5

# Challenge A — YOUR CODE
# NOTE: this repeats the assignment above; randn is called again without re-seeding,
# so y_quad gets a fresh noise sample and differs from the first version.
X_quad = np.linspace(-3, 3, 50)
y_quad = 1.5 * X_quad**2 - 2 * X_quad + 1 + np.random.randn(50) * 1.5

# Step 1: fit a straight line, report MSE
# Step 2: define mse_quadratic(params) where params = [a, b, c]
# Step 3: find_minima(mse_quadratic, [0, 0, 0])

# Challenge B — YOUR CODE

# Challenge C — YOUR CODE

#	Function	x_range to plot	Suggested x_start
A	$f(x) = x^6 - 4x^2 + 10$	$(-2, 2)$	$1.5$
B	$f(x) = (x - 3)^2 + 5$	$(0, 6)$	$0.0$
C	$f(x) = x^2 + 3|x|$	$(-4, 4)$	$2.0$
D	$f(x) = e^x - 5x$	$(0, 4)$	$3.0$
E	$f(x) = x^4 - 3x^3 + 2$	$(-1, 3)$	$2.5$

Learning Linear Regression by Inventing Gradient Descent¶

What you'll need¶

PART 1: Finding the Bottom of a Valley¶

Exercise 1.1 — Look Before You Leap¶

Exercise 1.2 — Hit and Trial¶

PART 2: Making the Machine Do the Searching¶

Exercise 2.1 — The Slope Tells You Which Way to Walk¶

Exercise 2.2 — One Step at a Time¶

Exercise 2.3 — Build `find_minima_1d`¶

Exercise 2.4 — Watch It Learn¶

PART 3: Stress-Testing Your Algorithm¶

Exercise 3.1 — New Functions, Same Algorithm¶

Exercise 3.2 — Function A Is Sneaky¶

PART 4: Two Variables — A Landscape Instead of a Curve¶

Exercise 4.1 — See the Landscape¶

Exercise 4.2 — Partial Derivatives¶

Exercise 4.3 — Build `find_minima_2d`¶

Exercise 4.4 — Visualize the Path (2D)¶

PART 5: Going Generic¶

Exercise 5.1 — N Variables¶

Exercise 5.2 — Three Variables¶

PART 6: The Real Problem — Fitting a Line to Data¶

Exercise 6.1 — What Does It Mean to Fit a Line?¶

Exercise 6.2 — Write the MSE Function¶

Exercise 6.3 — The MSE Landscape¶

PART 7: Putting It All Together — Linear Regression via Gradient Descent¶

Exercise 7.1 — Minimize MSE with `find_minima`¶

Exercise 7.2 — Watch the Line Learn¶

Exercise 7.3 — New Dataset, Same Code¶

Exercise 7.4 — Sanity Check with NumPy¶

PART 8: Bonus Challenges¶

Challenge A — What if the data isn't linear?¶

Challenge B — Learning Rate Scheduler¶

Challenge C — Stochastic Gradient Descent¶

Reflection — What Did You Just Build?¶

Learning Linear Regression by Inventing Gradient Descent¶

What you'll need¶

PART 1: Finding the Bottom of a Valley¶

Exercise 1.1 — Look Before You Leap¶

Exercise 1.2 — Hit and Trial¶

PART 2: Making the Machine Do the Searching¶

Exercise 2.1 — The Slope Tells You Which Way to Walk¶

Exercise 2.2 — One Step at a Time¶

Exercise 2.3 — Build find_minima_1d¶

Exercise 2.4 — Watch It Learn¶

PART 3: Stress-Testing Your Algorithm¶

Exercise 3.1 — New Functions, Same Algorithm¶

Exercise 3.2 — Function A Is Sneaky¶

PART 4: Two Variables — A Landscape Instead of a Curve¶

Exercise 4.1 — See the Landscape¶

Exercise 4.2 — Partial Derivatives¶

Exercise 4.3 — Build find_minima_2d¶

Exercise 4.4 — Visualize the Path (2D)¶

PART 5: Going Generic¶

Exercise 5.1 — N Variables¶

Exercise 5.2 — Three Variables¶

PART 6: The Real Problem — Fitting a Line to Data¶

Exercise 6.1 — What Does It Mean to Fit a Line?¶

Exercise 6.2 — Write the MSE Function¶

Exercise 6.3 — The MSE Landscape¶

PART 7: Putting It All Together — Linear Regression via Gradient Descent¶

Exercise 7.1 — Minimize MSE with find_minima¶

Exercise 7.2 — Watch the Line Learn¶

Exercise 7.3 — New Dataset, Same Code¶

Exercise 7.4 — Sanity Check with NumPy¶

PART 8: Bonus Challenges¶

Challenge A — What if the data isn't linear?¶

Challenge B — Learning Rate Scheduler¶

Challenge C — Stochastic Gradient Descent¶

Reflection — What Did You Just Build?¶

Exercise 2.3 — Build `find_minima_1d`¶

Exercise 4.3 — Build `find_minima_2d`¶

Exercise 7.1 — Minimize MSE with `find_minima`¶