Autograd MLP: Neural Network with Automatic Differentiation

Difficulty: hard · Tags: autograd, neural-networks, training

Use your Value class to build and train a small multi-layer perceptron (MLP). This is the capstone for the autograd module.

What you are building

1) Neuron

  • Parameters: weights w (list of Value), bias b (Value)
  • Activation: "tanh", "relu", or "linear"
from typing import List

# Value is your autograd Value class from the earlier exercises in this module.

class Neuron:
    def __init__(self, nin: int, activation: str = "tanh"):
        # initialize w with random Values in [-1, 1]
        # initialize b = Value(0.0)
        pass

    def __call__(self, x: List[Value]) -> Value:
        # act = sum(w_i * x_i) + b
        # apply activation
        pass

    def parameters(self) -> List[Value]:
        pass

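One possible way to fill this in, assuming the Value class from the earlier exercises wraps a plain float and exposes tanh() and relu() methods:

import random
from typing import List

class Neuron:
    def __init__(self, nin: int, activation: str = "tanh"):
        # one weight per input, drawn uniformly from [-1, 1], plus a zero bias
        self.w = [Value(random.uniform(-1, 1)) for _ in range(nin)]
        self.b = Value(0.0)
        self.activation = activation

    def __call__(self, x: List[Value]) -> Value:
        # weighted sum of inputs plus bias, seeded with b to stay in Value arithmetic
        act = sum((wi * xi for wi, xi in zip(self.w, x)), self.b)
        if self.activation == "tanh":
            return act.tanh()
        if self.activation == "relu":
            return act.relu()
        return act  # "linear": no nonlinearity

    def parameters(self) -> List[Value]:
        return self.w + [self.b]
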
2) Layer

  • A list of nout neurons
class Layer:
    def __init__(self, nin: int, nout: int, activation: str = "tanh"):
        pass

    def __call__(self, x: List[Value]) -> List[Value]:
        pass

    def parameters(self) -> List[Value]:
        pass

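A sketch of Layer built on the Neuron above. The return hint is widened to Value | List[Value] so a single-output layer can hand back a bare Value, as required by the Notes below:

from typing import List

class Layer:
    def __init__(self, nin: int, nout: int, activation: str = "tanh"):
        # nout independent neurons, each reading all nin inputs
        self.neurons = [Neuron(nin, activation) for _ in range(nout)]

    def __call__(self, x: List[Value]) -> Value | List[Value]:
        outs = [n(x) for n in self.neurons]
        # a single-output layer returns the Value itself, not a length-1 list
        return outs[0] if len(outs) == 1 else outs

    def parameters(self) -> List[Value]:
        # flatten the parameters of every neuron in the layer
        return [p for n in self.neurons for p in n.parameters()]
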
3) MLP

  • Stack multiple layers
  • Default activations: tanh for hidden layers, linear for output
  • Accept input as List[float] or List[Value]
class MLP:
    def __init__(self, nin: int, nouts: List[int], activations: List[str] | None = None):
        pass

    def __call__(self, x: List[float] | List[Value]) -> Value | List[Value]:
        pass

    def parameters(self) -> List[Value]:
        pass

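A possible MLP on top of the Layer sketch above. It promotes plain floats to Values on the way in, re-wraps any bare Value between layers, and returns a single Value when the final layer has one output:

from typing import List

class MLP:
    def __init__(self, nin: int, nouts: List[int], activations: List[str] | None = None):
        if activations is None:
            # default: tanh for every hidden layer, linear for the output layer
            activations = ["tanh"] * (len(nouts) - 1) + ["linear"]
        sizes = [nin] + nouts
        self.layers = [Layer(sizes[i], sizes[i + 1], activations[i])
                       for i in range(len(nouts))]

    def __call__(self, x: List[float] | List[Value]) -> Value | List[Value]:
        # promote raw floats to Values so they join the computation graph
        out = [xi if isinstance(xi, Value) else Value(float(xi)) for xi in x]
        for layer in self.layers:
            out = layer(out)
            if not isinstance(out, list):
                # a width-1 layer returned a bare Value; re-wrap it for the next layer
                out = [out]
        return out[0] if len(out) == 1 else out

    def parameters(self) -> List[Value]:
        return [p for layer in self.layers for p in layer.parameters()]
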
4) train(model, X, y, epochs, lr)

  • Train with mean squared error (MSE)
  • Return a list of loss values (floats), one per epoch
def train(model, X, y, epochs, lr) -> List[float]:
    # preds = [model(xi) for xi in X]
    # loss = mean((pred - target)^2)
    # backward + SGD update
    pass

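A minimal training-loop sketch for single-output models such as the XOR example below, assuming Value exposes .data, .grad, and backward() and supports arithmetic with plain floats:

from typing import List

def train(model: MLP, X: List[List[float]], y: List[float],
          epochs: int, lr: float) -> List[float]:
    losses: List[float] = []
    for _ in range(epochs):
        # forward pass: one prediction per sample
        preds = [model(xi) for xi in X]

        # mean squared error, built up entirely in Value arithmetic
        loss = Value(0.0)
        for pred, target in zip(preds, y):
            diff = pred - target
            loss = loss + diff * diff
        loss = loss * (1.0 / len(X))

        # zero gradients before backward, since _backward accumulates with +=
        for p in model.parameters():
            p.grad = 0.0

        loss.backward()

        # plain SGD step
        for p in model.parameters():
            p.data -= lr * p.grad

        losses.append(float(loss.data))
    return losses
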
Notes

  • Use += in _backward paths so gradients accumulate correctly.
  • Zero parameter gradients before each backward pass.
  • If a layer has one output, return a single Value instead of a length-1 list.

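A quick illustration of the first note, using the assumed Value API from the earlier exercises: a node that feeds the graph twice must collect gradient from both paths, which only works if _backward accumulates with +=.

a = Value(3.0)
b = a + a          # a appears twice in the graph
b.backward()
print(a.grad)      # 2.0: each path contributes 1.0 via +=; plain assignment would leave 1.0
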
Example

model = MLP(2, [4, 1])
losses = train(model, X=[[0,0],[0,1],[1,0],[1,1]], y=[0,1,1,0], epochs=50, lr=0.1)
print(losses[-1])