Module 2.5 - Understanding Gradients¶

Terminology¶

  • Scalar -> Tensor
  • Derivative -> Gradient
  • Recommendation: reason about a gradient as a collection of many scalar derivatives

Notation: Gradient¶

A function from a tensor to a tensor

$$ G(x) $$

In [2]:
draw_boxes(["", "$G(x)$"], [1])
Out[2]:

General Case¶

So far we have only dealt with functions that return a single scalar value.

What if $G$ returns a tensor?

Function to Tensor¶

Trick: Pretend $G$ is actually many different scalar functions:

$$ G(x) = [G^1(x), G^2(x), \ldots, G^N(x)] $$

Example: Fun¶

$$G([x_1, x_2]) = [x_1, x_1 x_2]$$

How many derivatives are there?

All the derivatives¶

$$G'^1_{x_1}([x_1, x_2]) $$ $$G'^1_{x_2}([x_1, x_2]) $$ $$G'^2_{x_1}([x_1, x_2]) $$ $$G'^2_{x_2}([x_1, x_2]) $$

Example: All Derivatives¶

$$G([x_1, x_2]) = [x_1, x_1 x_2]$$ $$G'^1_{x_1}([x_1, x_2]) = 1$$ $$G'^1_{x_2}([x_1, x_2]) = 0$$ $$G'^2_{x_1}([x_1, x_2]) = x_2$$ $$G'^2_{x_2}([x_1, x_2]) = x_1$$
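
As a quick sanity check (not from the original slides), here is a standalone Python snippet that approximates all four derivatives with central differences:

In [ ]:
# Numeric check of the four derivatives of G([x1, x2]) = [x1, x1 * x2].
def G(x1, x2):
    return [x1, x1 * x2]

def numeric_derivative(i, j, x, eps=1e-6):
    # Central-difference derivative of output i with respect to input j.
    hi, lo = list(x), list(x)
    hi[j] += eps
    lo[j] -= eps
    return (G(*hi)[i] - G(*lo)[i]) / (2 * eps)

x = [2.0, 3.0]
for i in range(2):
    for j in range(2):
        print(f"G'^{i + 1}_x{j + 1} = {numeric_derivative(i, j, x):.6f}")
# Expected: 1 and 0 for the first output; x2 = 3 and x1 = 2 for the second.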

Example: Chain Rule For Gradients¶

  • $G(x) = [G^1(x), G^2(x)]$ - tensor to tensor
  • $f(x)$ - tensor to scalar

Mathematical form: Chain Rule For Gradients¶

$f(G(x))$

  • $z_1 = G^1(x)$, $z_2 = G^2(x), \ldots$
  • $d_1 = f'_{z_1}(z), d_2 = f'_{z_2}(z), \ldots$
  • $f'_{x_j}(G(x)) = d_1 G^{'1}_{x_j}(x) + d_2 G^{'2}_{x_j}(x)$

Example: Fun Derivatives¶

Derivatives

$$G'^1_{x_1}([x_1, x_2]) = 1$$ $$G'^1_{x_2}([x_1, x_2]) = 0$$ $$G'^2_{x_1}([x_1, x_2]) = x_2$$ $$G'^2_{x_2}([x_1, x_2]) = x_1$$

$$f'_{x_1}(G([x_1, x_2])) = d_1 \times 1 + d_2 \times x_2 $$ $$f'_{x_2}(G([x_1, x_2])) = d_1 \times 0 + d_2 \times x_1 $$

Implementation¶

In [3]:
class MyFun(minitorch.Function):
    @staticmethod
    def forward(ctx, x: Tensor) -> Tensor:
        # Forward pass: G([x1, x2]) = [x1, x1 * x2].
        ctx.save_for_backward(x)
        return minitorch.tensor([x[0], x[0] * x[1]])

    @staticmethod
    def backward(ctx, d: Tensor) -> Tensor:
        # Chain rule: f'_{x1} = d1 * 1 + d2 * x2,  f'_{x2} = d1 * 0 + d2 * x1.
        (x,) = ctx.saved_values
        return minitorch.tensor([d[0] * 1 + d[1] * x[1], d[1] * x[0]])
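
A minimal usage sketch, assuming the course library's autodiff API (minitorch.Function.apply, Tensor.sum, Tensor.backward, and .grad, as in the minitorch codebase):

In [ ]:
# Hypothetical usage; assumes minitorch's autodiff API as described above.
x = minitorch.tensor([2.0, 3.0], requires_grad=True)
out = MyFun.apply(x)   # forward: [2.0, 2.0 * 3.0] = [2.0, 6.0]
out.sum().backward()   # upstream gradient d = [1.0, 1.0]
print(x.grad)          # expect [d1 * 1 + d2 * x2, d2 * x1] = [4.0, 2.0]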

Avoiding Gradients¶

Special Function: Map¶

Let $G$ be a map of $x^2$: the square applied at each position.

$$G([x_1, x_2])= [x_1^2, x_2^2]$$

Square Derivatives¶

$$G^{'1}_{x_1}([x_1, x_2])$$ $$G^{'2}_{x_1}([x_1, x_2])$$ $$G^{'1}_{x_2}([x_1, x_2])$$ $$G^{'2}_{x_2}([x_1, x_2])$$
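
Working these out: each output of the map depends only on the input at the same position, so the cross derivatives are zero.

$$G^{'1}_{x_1}([x_1, x_2]) = 2 x_1$$ $$G^{'2}_{x_1}([x_1, x_2]) = 0$$ $$G^{'1}_{x_2}([x_1, x_2]) = 0$$ $$G^{'2}_{x_2}([x_1, x_2]) = 2 x_2$$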

Chain Rule¶

$$f'_{x_1}(G([x_1, x_2]))$$ $$f'_{x_2}(G([x_1, x_2]))$$
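
Dropping the zero cross terms, the chain rule collapses to one term per position:

$$f'_{x_1}(G([x_1, x_2])) = d_1 \times 2 x_1$$ $$f'_{x_2}(G([x_1, x_2])) = d_2 \times 2 x_2$$

This is what makes maps cheap: each position of the gradient is just $d_i$ times the local derivative at that position, with no interaction between positions. Here is a sketch in the same illustrative style as MyFun above (Square is a hypothetical name, not necessarily a minitorch built-in):

In [ ]:
class Square(minitorch.Function):
    @staticmethod
    def forward(ctx, x: Tensor) -> Tensor:
        # Map of x^2: square each position independently.
        ctx.save_for_backward(x)
        return minitorch.tensor([x[0] * x[0], x[1] * x[1]])

    @staticmethod
    def backward(ctx, d: Tensor) -> Tensor:
        # Diagonal chain rule: d_i times the local derivative 2 * x_i.
        (x,) = ctx.saved_values
        return minitorch.tensor([d[0] * 2 * x[0], d[1] * 2 * x[1]])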

Map Gradient¶

In [4]:
def label(t, d):
    return vstrut(0.5) // latex(t) // vstrut(0.5) // d


opts = ArrowOpts(arc_height=-0.5)
opts2 = ArrowOpts(arc_height=-0.2)


d = hcat(
    [
        label("$$", matrix(3, 2, "a")),
        left_arrow,
        label("$g'(x)$", matrix(3, 2, "b")),
        label("$d$", matrix(3, 2, "g", colormap=lambda i, j: drawing.papaya)),
    ],
    1,
)
d.connect(("b", 0, 0), ("a", 0, 0), opts2).connect(
    ("b", 1, 0), ("a", 1, 0), opts2
).connect(("g", 0, 0), ("b", 0, 0), opts).connect(("g", 1, 0), ("b", 1, 0), opts)
Out[4]:

Special Function: Zip¶

Let $G$ be a zip of multiplication.

$$G([x_1, x_2], [y_1, y_2]) = [x_1 y_1, x_2 y_2]$$

Multiplication Derivatives¶

$$G^{'1}_{x_1}(x, y)$$ $$G^{'2}_{x_1}(x, y)$$ $$G^{'1}_{y_1}(x, y)$$ $$G^{'2}_{y_1}(x, y)$$
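
Working these out from $G(x, y) = [x_1 y_1, x_2 y_2]$: again each output touches only one position of each input, so the cross derivatives vanish.

$$G^{'1}_{x_1}(x, y) = y_1$$ $$G^{'2}_{x_1}(x, y) = 0$$ $$G^{'1}_{y_1}(x, y) = x_1$$ $$G^{'2}_{y_1}(x, y) = 0$$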

Chain Rule¶

$$f'_{x_1}(G(x, y))$$ $$f'_{y_2}(G(x, y))$$
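
With the zero terms dropped:

$$f'_{x_1}(G(x, y)) = d_1 \times y_1$$ $$f'_{y_2}(G(x, y)) = d_2 \times x_2$$

Each input position needs only $d$ at that position times the other argument at that position. Here is a sketch in the style of MyFun (Mul is a hypothetical illustration, not necessarily minitorch's built-in multiply):

In [ ]:
class Mul(minitorch.Function):
    @staticmethod
    def forward(ctx, x: Tensor, y: Tensor) -> Tensor:
        # Zip of multiplication: elementwise product.
        ctx.save_for_backward(x, y)
        return minitorch.tensor([x[0] * y[0], x[1] * y[1]])

    @staticmethod
    def backward(ctx, d: Tensor):
        # Returns one gradient per input: d times the other argument, elementwise.
        x, y = ctx.saved_values
        return (
            minitorch.tensor([d[0] * y[0], d[1] * y[1]]),
            minitorch.tensor([d[0] * x[0], d[1] * x[1]]),
        )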

Zip Gradient¶

In [5]:
d = hcat(
    [
        matrix(3, 2, "a1"),
        matrix(3, 2, "a"),
        left_arrow,
        matrix(3, 2, "b"),
        matrix(3, 2, "g", colormap=lambda i, j: drawing.papaya),
    ],
    1,
)
d.connect(("b", 0, 0), ("a", 0, 0), opts).connect(
    ("b", 1, 0), ("a", 1, 0), opts
).connect(("g", 0, 0), ("b", 0, 0), opts)
Out[5]:

Quiz¶

Puzzles Walkthrough¶

Q&A¶