Module 1.1 - Learning With Derivatives¶

Training Data¶

  • A set of datapoints, each a pair $(x, y)$
  • $x$ - position, with coordinates $x_1, x_2$
  • $y$ - true label, shown as color
In [2]:
split_graph(s1, s2)
Out[2]:

Math¶

  • Linear Model

$$m(x; \theta) = x_1 \times w_1 + x_2 \times w_2 + b, \qquad \theta = (w_1, w_2, b)$$

In [3]:
def forward(self, x1: float, x2: float) -> float:
    return self.w1.value * x1 + self.w2.value * x2 + self.b.value

Graphical Notation¶

  • Red is more positive, blue is more negative.
  • $m(x)$ provides a value at every point $(x_1, x_2)$.
  • The line represents the separator, where $m(x) = 0$ (see the sketch below).
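For concreteness, here is a minimal sketch (not part of the lecture notebook) of how the sign of $m(x)$ picks a side of the separator; the helper name `classify` and the sample weights are illustrative assumptions.

def classify(x1: float, x2: float, w1: float, w2: float, b: float) -> str:
    # Sign of the linear model picks the side; m(x) == 0 is exactly the separator.
    m_x = x1 * w1 + x2 * w2 + b
    return "red" if m_x > 0 else "blue"

classify(0.8, 0.9, 1.0, 1.0, -0.9)  # positive side -> "red"
classify(0.1, 0.2, 1.0, 1.0, -0.9)  # negative side -> "blue"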

Model 1¶

  • Linear Model
In [4]:
from minitorch import Parameter, Module
class Linear(Module):
    def __init__(self, w1, w2, b):
        super().__init__()
        self.w1 = Parameter(w1)
        self.w2 = Parameter(w2)
        self.b = Parameter(b)

    def forward(self, x1: float, x2: float) -> float:
        return self.w1.value * x1 + self.w2.value * x2 + self.b.value

Decision Boundary: Model 1¶

In [5]:
model = Linear(w1=1, w2=1, b=-0.9)
draw_graph(model)
Out[5]:

Distance Determines Fit¶

  • The sign of $m(x)$ gives red or blue; distance from the separator gives how strongly.
In [6]:
with_points(s1, s2, Linear(1, 1, -0.4))
Out[6]:

Point Loss¶

In [8]:
graph(point_loss, [], [])
Out[8]:
In [9]:
graph(point_loss, [], [-2, -0.2, 1])
Out[9]:


Warmup: ReLU¶

In [10]:
def point_loss(m_x):
    return minitorch.operators.relu(m_x)
In [11]:
graph(point_loss, [], [])
Out[11]:
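A quick self-contained check of this warmup loss (plain-Python stand-in for `minitorch.operators.relu`; values in the comment are exact):

def relu_point_loss(m_x: float) -> float:
    return max(0.0, m_x)  # zero on one side of zero, grows linearly on the other

[relu_point_loss(v) for v in (-2.0, -0.2, 1.0)]  # -> [0.0, 0.0, 1.0]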

Loss¶

  • The loss $L(\theta)$ is a function of the parameters
  • Changing the parameters changes the decision boundary

Lecture Quiz¶

Outline¶

  • Model Fit
  • Symbolic Derivatives
  • Numerical Derivatives
  • Module 1

Model Fitting¶

Class Goal¶

  • Find parameters that minimize loss
In [12]:
hcat(
    [show(Linear(1, 1, -0.6)), show(Linear(1, 1, -0.7)), show(Linear(1, 1, -0.8))], 0.3
)
Out[12]:

Numerical Optimization¶

  • Many, many different approaches
  • Our focus: gradient descent
  • Workhorse of modern machine learning

Iterative Parameter Fitting¶

  1. Compute the loss function, $L(\theta)$
  2. See how small changes to the parameters would change the loss
  3. Update the parameters to locally reduce the loss (a sketch of the full loop follows below)
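A minimal sketch of this loop for the Linear model above (illustrative only: it assumes the `full_loss` defined later in the lecture, a hand-picked learning rate `lr`, and that `Module.parameters` and `Parameter.update` behave as in minitorch):

lr = 0.1
model = Linear(1, 1, 0)
for step in range(10):
    for p in model.parameters():            # loop over w1, w2, b
        def loss_in_p(v: float) -> float:   # steps 1-2: loss as a function of this one parameter
            old = p.value
            p.update(v)
            out = full_loss(model)
            p.update(old)
            return out
        slope = minitorch.central_difference(loss_in_p, p.value)
        p.update(p.value - lr * slope)      # step 3: move downhill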

Example: Update Bias¶

In [13]:
model1 = Linear(w1=1, w2=1, b=-0.4)
model2 = Linear(w1=1, w2=1, b=-0.5)
In [14]:
compare(model1, model2)
Out[14]:

Step 1: Compute Loss¶

In [15]:
with_points(s1, s2, Linear(1, 1, -1.5))
Out[15]:
In [16]:
def point_loss(out, y=1):
    # Log-sigmoid loss: near zero on the correct side,
    # grows roughly linearly with distance on the wrong side.
    return y * -math.log(minitorch.operators.sigmoid(-out))
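To see the shape of this loss, here are rough values from a self-contained re-computation (plain-Python sigmoid; numbers are approximate):

import math

def sigmoid_fn(z: float) -> float:
    return 1.0 / (1.0 + math.exp(-z)) if z >= 0 else math.exp(z) / (1.0 + math.exp(z))

[round(-math.log(sigmoid_fn(-out)), 3) for out in (-3.0, 0.0, 3.0)]
# -> [0.049, 0.693, 3.049]: near zero far on one side, log 2 at the boundary, growing on the other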

Loss¶

In [17]:
def full_loss(m):  # Given m( ; \theta)
    l = 0
    for x, y in zip(s.X, s.y):  # For all training data
        # Red points (y > 0) want m(x) positive; blue points want it negative.
        l += point_loss(-m.forward(*x)) if y > 0 else point_loss(m.forward(*x))
    return l
In [18]:
hcat(
    [
        graph(point_loss, [], [-2, -0.2, 1]),
        graph(lambda x: point_loss(-x), [-1, 0.4, 1.3], []),
    ],
    0.3,
)
Out[18]:

Step 2: Find Direction of Improvement¶

In [19]:
hcat([show(Linear(1, 1, -1.5)), show(Linear(1, 1, -1.45))], 0.3)
Out[19]:

Step 3: Update Parameters Iteratively¶

In [20]:
set_svg_height(300)
show_loss(full_loss, Linear(1, 1, 0))
Out[20]:

Our Challenge¶

How do we find the right direction?

Symbolic Derivatives¶

Review: What is a Derivative?¶

How small changes in input impact output.

  • $f(x)$ - function
  • $x$ - point
  • $f'(x)$ - "rise/run"

Review: Derivative¶

$$f(x) = x^2 + 1$$

In [21]:
def f(x):
    return x * x + 1.0


plot_function("f(x)", f)

Review: Derivative¶

$$f(x) = x^2 + 1$$ $$f'(x) = 2x$$

In [22]:
def f_prime(x):
    return 2 * x


def tangent_line(slope, x, y):
    def line(x_):
        return slope * (x_ - x) + y

    return line


plot_function("f(x) vs f'(2)", f, fn2=tangent_line(f_prime(2), 2, f(2)))

Symbolic Derivative¶

  • Standard high-school derivatives
  • Rewrite $f$ to new form $f'$
  • Produces mathematical function

Example Function¶

$$f(x) = \sin(2 x)$$

In [23]:
plot_function("f(x) = sin(2x)", lambda x: math.sin(2 * x))

Symbolic Derivative¶

$$f(x) = \sin(2 x) \Rightarrow f'(x) = 2 \cos(2 x)$$
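By the chain rule:

$$f'(x) = \cos(2x) \cdot \frac{d}{dx}(2x) = 2\cos(2x)$$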

In [24]:
plot_function(
    "f'(x) = 2*cos(2x)", lambda x: 2 * math.cos(2 * x), fn2=lambda x: math.sin(2 * x)
)

Multiple Arguments¶

$$f(x, y) = \sin(x) + 2 \cos(y)$$

In [25]:
plot_function3D(
    "f(x, y) = sin(x) + 2 * cos(y)", lambda x, y: math.sin(x) + 2 * math.cos(y)
)

Derivatives with Multiple Arguments¶

$$f_x'(x, y) = \cos(x) \ \ \ f_y'(x, y) = -2 \sin(y)$$
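Each partial derivative treats the other argument as a constant:

$$f_x'(x, y) = \frac{\partial}{\partial x}\left[\sin(x) + 2\cos(y)\right] = \cos(x), \qquad f_y'(x, y) = \frac{\partial}{\partial y}\left[\sin(x) + 2\cos(y)\right] = -2\sin(y)$$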

In [26]:
plot_function3D("f'_x(x, y) = cos(x)", lambda x, y: math.cos(x))

Review: Symbolic Derivatives¶

Expectation: Apply basic derivative rules.

  • Differentiation Rules

Numerical Derivatives¶

What if we don't have symbols?¶

$$f(x) = ...$$ $$f'(x) = ...$$

For example if $f$ is unseen code.

In [27]:
def f(x: float) -> float: ...

Derivative as higher-order function¶

$$f(x) = ...$$ $$f'(x) = ...$$

In [28]:
def derivative(f: Callable[[float], float]) -> Callable[[float], float]:
    def f_prime(x: float) -> float: ...

    return f_prime

Definition of Derivative¶

$$f'(x) = \lim_{\epsilon \rightarrow 0} \frac{f(x + \epsilon) - f(x - \epsilon)}{2\epsilon}$$

Central Difference¶

Approximate the derivative with a small, fixed $\epsilon$

$$f'(x) \approx \frac{f(x + \epsilon) - f(x-\epsilon)}{2\epsilon}$$

Approximating Derivative¶

Key Idea: Only need to call $f$.

In [29]:
def central_difference(f: Callable[[float], float], x: float) -> float: ...
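One way to fill this in (a minimal sketch with an assumed fixed `epsilon`; Module 1 asks you to write your own version, and minitorch's also handles multiple arguments):

from typing import Callable

def central_difference_sketch(f: Callable[[float], float], x: float, epsilon: float = 1e-6) -> float:
    # Slope of the secant line through (x - eps, f(x - eps)) and (x + eps, f(x + eps))
    return (f(x + epsilon) - f(x - epsilon)) / (2 * epsilon)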

Derivative as higher-order function¶

$$f(x) = ...$$ $$f'(x) = ...$$

In [30]:
def derivative(f: Callable[[float], float]) -> Callable[[float], float]:
    def f_prime(x: float) -> float:
        return minitorch.central_difference(f, x)

    return f_prime
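For example, applied to the earlier $f(x) = x^2 + 1$ (value in the comment is approximate):

f_prime_numeric = derivative(lambda x: x * x + 1.0)
f_prime_numeric(2.0)  # ~= 4.0, matching the symbolic derivative 2x at x = 2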

Advanced: Multiple Arguments¶

Turn a 2-argument function into a 1-argument one.

In [31]:
def f(x, y): ...


def f_x_prime(x: float, y: float) -> float:
    def inner(x: float) -> float:
        return f(x, y)

    return derivative(inner)(x)
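A small check of this pattern on the earlier two-argument example (the names `example_f` and `example_f_x_prime` are illustrative; value in the comment is approximate):

import math

def example_f(x: float, y: float) -> float:
    return math.sin(x) + 2 * math.cos(y)

def example_f_x_prime(x: float, y: float) -> float:
    def inner(x_: float) -> float:  # freeze y, vary only x
        return example_f(x_, y)
    return derivative(inner)(x)

example_f_x_prime(1.0, 2.0)  # ~= cos(1.0) ~= 0.540, independent of y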

Example¶

In [32]:
def sigmoid(x: float) -> float:
    if x >= 0:
        return 1.0 / (1.0 + math.exp(-x))
    else:
        return math.exp(x) / (1.0 + math.exp(x))


plot_function("sigmoid", sigmoid)

Example¶

In [33]:
sigmoid_prime = derivative(sigmoid)

plot_function("Derivative of sigmoid", sigmoid_prime)

Symbolic¶

  • Transformation of mathematical function
  • Gives full form of derivative
  • Utilizes mathematical identities

Numerical¶

  • Only requires evaluating function
  • Computes derivative at a point
  • Can be applied to fully black-box function

Next Class: Autodifferentiation¶

  • Computes derivatives on the program's trace
  • Efficient for large numbers of parameters
  • Works directly on Python code

Module-1¶

Module-1 Learning Objectives¶

  • Practical understanding of derivatives
  • Dive into autodifferentiation
  • Parameters and their usage

Module-1: What is it?¶

  • Numerical and symbolic derivatives
  • Implement our numerical class
  • Implement autodifferentiation
  • Everything is scalars for now (no "gradients")

Module-1 Overview¶

  • 5 Tasks
  • Module 1

Q&A¶