Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Empty file added examples/aeris/__init__.py
Empty file.
53 changes: 53 additions & 0 deletions examples/aeris/aeris.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,53 @@
# aeris.toml — AERIS continuous-learning example configuration
seed = 42
device = "auto"
multi_gpu = false
verbosity = "INFO:2"

[model]
# Pretrained checkpoint consumed by the AERIS harness (examples/aeris/model.py).
name = "aeris_model.pt"
pretrained_path = "examples/aeris/model"

[data]
name = "aeris_dataset.csv"
path = "examples/aeris/data"
batch_size = 1

[train]
batch_size = 256
num_workers = 4
init_lr = 1e-3
max_iter = 100
grad_accumulation_steps = 1

[continual_learning]
# Update rule applied when learning is triggered; the lambda/decay settings
# below are read only for their matching update_mode.
update_mode = "base"

# JVP regularization (used when update_mode = "jvp_reg")
jvp_lambda = 10
jvp_deltax_norm = 1

# EWC (used when update_mode = "ewc_online")
ewc_lambda = 1000.0
ewc_ema_decay = 0.95

# KFAC (used when update_mode = "kfac_online")
kfac_lambda = 1e-2
kfac_ema_decay = 0.95

[drift_detection]
detector_name = "ADWINDetector"
detection_interval = 1
aggregation = "mean"
metric_index = 0
reset_after_learning = false
max_stream_updates = 250

# ADWIN hyperparameters
adwin_delta = 0.2
adwin_minor_threshold = 0.1
adwin_moderate_threshold = 0.6

[logging]
backend = "wandb"
experiment_name = "aeris-cl"
196 changes: 196 additions & 0 deletions examples/aeris/model.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,196 @@
# examples/aeris/model.py
"""AERIS model harness for the BaseSim continuous-learning framework.

This harness wraps a deep fully-connected network (``AerisFullStructure``) trained to predict enthalpy per atom for a given fuel material."""

import gc
import torch
import numpy as np
from typing import Tuple, Optional, List, Any, Mapping, cast
from torch import nn, Tensor
from torch.optim import Optimizer
from torch.utils.data import DataLoader, ConcatDataset, TensorDataset

from model.torch_model_harness import BaseModelHarness
from config.configuration import Config

from examples.aeris.utils import (
load_datasets,
make_loader,
load_pretrained_model,
split_into_windows,
)

# Aeris model architecture used for prediction
class AerisFullStructure(nn.Module):
    """Fully-connected regression network producing one scalar per sample.

    The first hidden layer's width scales with the input dimension
    (2 * input_dim, clamped to [512, 1024]); the remaining layers taper
    down to a single output unit.
    """

    def __init__(self, input_dim, dropout=0.3):
        super().__init__()
        # First hidden width: 2 * input_dim, clamped to the range [512, 1024].
        width = min(1024, max(512, input_dim * 2))
        stack = [
            nn.Linear(input_dim, width), nn.ReLU(), nn.BatchNorm1d(width),
            nn.Linear(width, width), nn.ReLU(), nn.Dropout(dropout),
            nn.Linear(width, 512), nn.ReLU(), nn.BatchNorm1d(512),
            nn.Linear(512, 512), nn.ReLU(), nn.Dropout(dropout),
            nn.Linear(512, 256), nn.ReLU(), nn.BatchNorm1d(256),
            nn.Linear(256, 256), nn.ReLU(), nn.Dropout(dropout),
            nn.Linear(256, 128), nn.ReLU(), nn.BatchNorm1d(128),
            nn.Linear(128, 64), nn.ReLU(), nn.Dropout(dropout),
            nn.Linear(64, 32), nn.ReLU(), nn.Linear(32, 1),
        ]
        self.layers = nn.Sequential(*stack)

    def forward(self, x):
        """Run the stack; returns a tensor of shape (batch, 1)."""
        return self.layers(x)


# Fraction of each time window reserved for validation (taken from the
# chronological tail of the window).
_VAL_FRACTION: float = 0.2


class AERIS(BaseModelHarness):
    """
    Continuous-learning harness for the AERIS prediction model.

    Serves a chronological dataset as a stream of fixed time windows:
    ``update_data_stream`` advances to the next window (archiving the
    previous one), ``get_cur_data_loaders`` exposes loaders for the
    current window, and ``get_hist_data_loaders`` replays every archived
    window.
    """

    def __init__(self, cfg: Config):
        """Load the pretrained checkpoint, scale the dataset with the
        training-time scaler, and split it into chronological windows.

        Args:
            cfg: Framework configuration (model/data paths, train settings).
        """
        # ----- build model ---------------------------------------------------
        ckpt = load_pretrained_model(
            cfg.model.pretrained_path, cfg.model.name, device=cfg.device
        )
        feature_names: List[str] = ckpt["feature_names"]
        scaler = ckpt["scaler"]  # fitted feature scaler saved with the checkpoint
        input_dim = int(ckpt["input_dim"])

        model = AerisFullStructure(input_dim=input_dim)
        model.load_state_dict(ckpt["model_state_dict"])
        model.to(cfg.device)
        model.eval()

        super().__init__(cfg=cfg, model=model)

        # ----- eval metrics (prediction) -------------------------------------
        self.eval_metrics = {"mae": self.mae_metric(), "loss": self.get_criterion()}
        # BUGFIX: keys must mirror ``eval_metrics`` ("mae", not "accuracy") so
        # the framework can resolve each metric's optimization direction.
        self.higher_is_better = {"mae": False, "loss": False}

        # ----- data loaders -------------------------------------
        X, y = load_datasets(cfg.data.path, cfg.data.name, feature_names, input_dim)
        # X shape: (n_samples, input_dim), y shape: (n_samples, 1)

        # Scale exactly as at training time (same fitted scaler).
        X_scaled = scaler.transform(X).astype(np.float32)
        X_tensor = torch.tensor(X_scaled, dtype=torch.float32)
        y_tensor = torch.tensor(y, dtype=torch.float32)

        self.windows = split_into_windows(X_tensor, y_tensor)
        if not self.windows:
            # Fail fast with a clear message instead of an IndexError below.
            raise ValueError("split_into_windows produced no time windows")
        print(
            f"Prepared {len(self.windows)} time windows for streaming. "
            f"Each window has ~{self.windows[0][0].shape[0]} samples."
        )

        # ----- streaming state -----------------------------------------------
        self.window_idx: int = 0  # index of the *next* window to serve
        self.history_windows: List[Tuple[Tensor, Tensor]] = []

        self._cur_train_loader: Optional[DataLoader] = None
        self._cur_val_loader: Optional[DataLoader] = None

    def get_optmizer(self) -> Optimizer:  # noqa: D102 (spelling kept for ABC)
        return torch.optim.Adam(self.model.parameters(), lr=self.cfg.train.init_lr)

    def get_criterion(self):  # noqa: D102
        return nn.MSELoss()

    def mae_metric(self):
        """Return the mean-absolute-error metric used for evaluation."""
        return nn.L1Loss()

    def get_cur_data_loaders(self) -> Tuple[DataLoader, DataLoader]:  # noqa: D102
        assert self._cur_train_loader is not None and self._cur_val_loader is not None
        return self._cur_train_loader, self._cur_val_loader

    def get_hist_data_loaders(
        self,
    ) -> Tuple[Optional[DataLoader], Optional[DataLoader]]:
        """Return loaders over all previously-seen time windows.

        Returns ``(None, None)`` until at least two windows have been served.
        """
        if self.window_idx <= 1:
            return None, None

        # Re-apply the chronological train/val split to every archived window
        # so the history loaders mirror the per-window split used for training.
        hist_train_views: List[TensorDataset] = []
        hist_val_views: List[TensorDataset] = []

        for X_w, y_w in self.history_windows:
            n = X_w.shape[0]
            n_val = max(1, int(n * _VAL_FRACTION))  # always hold out >= 1 sample
            n_train = n - n_val
            hist_train_views.append(TensorDataset(X_w[:n_train], y_w[:n_train]))
            hist_val_views.append(TensorDataset(X_w[n_train:], y_w[n_train:]))

        ds_hist_train: ConcatDataset[Any] = ConcatDataset(hist_train_views)
        ds_hist_val: ConcatDataset[Any] = ConcatDataset(hist_val_views)

        bs = self.cfg.train.batch_size
        nw = self.cfg.train.num_workers
        pin = torch.cuda.is_available()
        return (
            make_loader(
                ds_hist_train, bs, shuffle=True, num_workers=nw, pin_memory=pin
            ),
            make_loader(ds_hist_val, bs, shuffle=False, num_workers=nw, pin_memory=pin),
        )

    def update_data_stream(self) -> None:
        """Advance to the next chronological time window.

        The previous window is archived into ``history_windows`` and new
        train/val loaders are built from the upcoming window. Once every
        window has been served, the stream wraps around to the first one.
        """
        self._dispose_current_loaders()

        if self.window_idx >= len(self.windows):
            print(
                f"Warning: All {len(self.windows)} time windows exhausted; "
                "wrapping around to the first window."
            )
            self.window_idx = 0

        X_w, y_w = self.windows[self.window_idx]

        # Archive previous window in history (skip the very first call).
        if self.window_idx > 0:
            prev_X, prev_y = self.windows[self.window_idx - 1]
            # Only add if not already stored (idempotency guard).
            if len(self.history_windows) < self.window_idx:
                self.history_windows.append((prev_X, prev_y))

        # Train / val split: the chronologically last _VAL_FRACTION of the
        # window is held out for validation.
        n = X_w.shape[0]
        n_val = max(1, int(n * _VAL_FRACTION))
        n_train = n - n_val

        ds_train = TensorDataset(X_w[:n_train], y_w[:n_train])
        ds_val = TensorDataset(X_w[n_train:], y_w[n_train:])

        bs = self.cfg.train.batch_size
        nw = self.cfg.train.num_workers
        pin = torch.cuda.is_available()

        self._cur_train_loader = make_loader(
            ds_train, bs, shuffle=True, num_workers=nw, pin_memory=pin
        )
        self._cur_val_loader = make_loader(
            ds_val, bs, shuffle=False, num_workers=nw, pin_memory=pin
        )

        self.window_idx += 1

    # --------------------------------------------------------------------- #
    # Helpers
    # --------------------------------------------------------------------- #
    def _dispose_current_loaders(self) -> None:
        """Drop the current loaders and collect garbage so worker processes
        and pinned buffers are released before new loaders are built."""
        if self._cur_train_loader is not None:
            del self._cur_train_loader
            self._cur_train_loader = None
        if self._cur_val_loader is not None:
            del self._cur_val_loader
            self._cur_val_loader = None
        gc.collect()
Loading
Loading