From afc602b66d941635b4f1e5f91da5dd98a73b83a2 Mon Sep 17 00:00:00 2001 From: Grill cheese Date: Mon, 13 Apr 2026 02:40:55 -0400 Subject: [PATCH] Fix Sequential crash when GPU backend is None + update train_mlp example MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - containers.py: guard `backend.fnn` access with None check — fixes AttributeError on GPUs where `_get_backend()` returns None (e.g. RADV VEGA20) - train_mlp.py: reduce dataset from 25600 samples to 512 and epochs from 100 to 10 for a fast demo, bump lr from 1e-5 to 1e-3 so loss visibly drops in 10 epochs Closes #38 Co-Authored-By: Claude Opus 4.6 (1M context) --- examples/train_mlp.py | 10 +++++----- nn/containers.py | 2 +- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/examples/train_mlp.py b/examples/train_mlp.py index 1d0753d..4beb0d4 100644 --- a/examples/train_mlp.py +++ b/examples/train_mlp.py @@ -13,16 +13,16 @@ nn.Linear(64, 10), ) -optimizer = optim.AdamW(model.parameters(), lr=1e-5) +optimizer = optim.AdamW(model.parameters(), lr=1e-3) loss_fn = nn.CrossEntropyLoss() -# Synthetic dataset: 256 samples, 10 classes +# Synthetic dataset: 512 samples, 10 classes np.random.seed(42) -X = np.random.randn(25600, 64).astype(np.float32) -y = np.random.randint(0, 10, size=25600) +X = np.random.randn(512, 64).astype(np.float32) +y = np.random.randint(0, 10, size=512) batch_size = 32 -epochs = 100 +epochs = 10 for epoch in range(epochs): epoch_loss = 0.0 diff --git a/nn/containers.py b/nn/containers.py index ffd9fc1..c9ec59a 100644 --- a/nn/containers.py +++ b/nn/containers.py @@ -85,7 +85,7 @@ def forward(self, x: np.ndarray) -> np.ndarray: weight = _get_param_array(linear_mod.weight) bias = _get_param_array(linear_mod.bias) if linear_mod.bias is not None else None backend = linear_mod._get_backend() - fused_fn = getattr(backend.fnn, method_name, None) + fused_fn = getattr(backend.fnn, method_name, None) if backend is not None else None if fused_fn is not None: try: current = 
fused_fn(