feat(ocl): add Repeated Augmented Rehearsal (RAR)

tachyonicClock · hmgomes · commit b43c01aa3bd4 · 2025-12-08T11:18:10.000+13:00
diff --git a/.github/workflows/pr.yml b/.github/workflows/pr.yml
@@ -25,7 +25,7 @@ env:
 jobs:
   tests:
     name: "Tests"
-    timeout-minutes: 20
+    timeout-minutes: 30
     runs-on: ubuntu-latest
     strategy:
       fail-fast: true
diff --git a/src/capymoa/ann/_perceptron.py b/src/capymoa/ann/_perceptron.py
@@ -25,6 +25,7 @@ def forward(self, x: Tensor) -> Tensor:
         :param x: Input tensor of shape ``(batch_size, num_features)``.
         :return: Output tensor of shape ``(batch_size, num_classes)``.
         """
+        x = x.view(x.size(0), -1)  # Flatten input
         x = self._fc1(x)
         x = self._relu(x)
         x = self._fc2(x)
diff --git a/src/capymoa/ocl/strategy/__init__.py b/src/capymoa/ocl/strategy/__init__.py
@@ -2,5 +2,6 @@
 from ._slda import SLDA
 from ._ncm import NCM
 from ._gdumb import GDumb
+from ._rar import RAR
 
-__all__ = ["ExperienceReplay", "SLDA", "NCM", "GDumb"]
+__all__ = ["ExperienceReplay", "SLDA", "NCM", "GDumb", "RAR"]
diff --git a/src/capymoa/ocl/strategy/_rar.py b/src/capymoa/ocl/strategy/_rar.py
@@ -0,0 +1,124 @@
+import torch
+from torch import Tensor
+
+from capymoa.base import BatchClassifier
+from capymoa.ocl.util._coreset import ReservoirSampler
+from capymoa.ocl.base import TrainTaskAware, TestTaskAware
+
+from typing import Callable
+
+from torch import nn
+
+
+class RAR(BatchClassifier, TrainTaskAware, TestTaskAware):
+    """Repeated Augmented Rehearsal.
+
+    Repeated Augmented Rehearsal (RAR) [#f0]_ is a replay continual learning
+    strategy that combines data augmentation with repeated training on each
+    batch to mitigate catastrophic forgetting.
+
+    * Coreset Selection: Reservoir sampling is used to select a fixed-size
+      buffer of past examples.
+
+    * Coreset Retrieval: During training, the learner samples uniformly from the
+      buffer of past examples.
+
+    * Coreset Exploitation: The learner trains on the current batch of examples
+      and the sampled buffer examples, performing multiple optimization steps
+      per-batch using random augmentations of the examples.
+
+    * Task identities are not used by RAR itself; ``on_train_task`` and
+      ``on_test_task`` are only forwarded to the wrapped learner.
+
+    >>> from capymoa.ann import Perceptron
+    >>> from capymoa.classifier import Finetune
+    >>> from capymoa.ocl.strategy import RAR
+    >>> from capymoa.ocl.datasets import TinySplitMNIST
+    >>> from capymoa.ocl.evaluation import ocl_train_eval_loop
+    >>> import torch
+    >>> _ = torch.manual_seed(0)
+    >>> scenario = TinySplitMNIST()
+    >>> model = Perceptron(scenario.schema)
+    >>> learner = RAR(Finetune(scenario.schema, model), augment=nn.Dropout(p=0.2), repeats=2)
+    >>> results = ocl_train_eval_loop(
+    ...     learner,
+    ...     scenario.train_loaders(32),
+    ...     scenario.test_loaders(32),
+    ... )
+    >>> print(f"{results.accuracy_final*100:.1f}%")
+    41.5%
+
+    Usually more complex augmentations are used such as random crops and rotations.
+
+    .. [#f0] Zhang, Yaqian, Bernhard Pfahringer, Eibe Frank, Albert Bifet, Nick
+       Jin Sean Lim, and Yunzhe Jia. “A Simple but Strong Baseline for Online
+       Continual Learning: Repeated Augmented Rehearsal.” In Advances in Neural
+       Information Processing Systems 35: Annual Conference on Neural
+       Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA,
+       November 28 - December 9, 2022, edited by Sanmi Koyejo, S. Mohamed, A.
+       Agarwal, Danielle Belgrave, K. Cho, and A. Oh, 2022.
+       https://doi.org/10.5555/3600270.3601344.
+    """
+
+    def __init__(
+        self,
+        learner: BatchClassifier,
+        coreset_size: int = 200,
+        augment: Callable[[Tensor], Tensor] = nn.Identity(),
+        repeats: int = 1,
+    ) -> None:
+        """Initialize Repeated Augmented Rehearsal.
+
+        :param learner: Underlying learner to be trained with RAR.
+        :param coreset_size: Size of the coreset buffer.
+        :param augment: Data augmentation applied to every training batch. Takes a
+            Tensor of shape ``(batch_size, *schema.shape)`` and returns a Tensor of
+            the same shape. Either a :class:`torch.nn.Module` or a plain callable.
+        :param repeats: Number of times to repeat training on each batch, defaults to 1.
+        """
+        super().__init__(learner.schema)
+        # Only modules can be moved to a device; plain callables are used as given.
+        if isinstance(augment, nn.Module):
+            augment = augment.to(self.device)
+        self.learner = learner
+        self.augment = augment
+        self.repeats = repeats
+        self.shape = learner.schema.shape
+        num_features = learner.schema.get_num_attributes()
+        rng = torch.Generator().manual_seed(learner.random_seed)
+        self.coreset = ReservoirSampler(coreset_size, num_features, rng=rng)
+
+    def train_step(self, x_fresh: Tensor, y_fresh: Tensor) -> None:
+        """Train the wrapped learner once on fresh plus replayed, augmented data."""
+        x_replay, y_replay = self.coreset.sample(x_fresh.shape[0])
+        # Align device and dtype before concatenating, so a fresh batch that lives
+        # on a different device than the buffer samples does not break ``cat``.
+        x = torch.cat([t.to(self.device, self.x_dtype) for t in (x_fresh, x_replay)])
+        y = torch.cat([t.to(self.device, self.y_dtype) for t in (y_fresh, y_replay)])
+        # The augmentation receives the unflattened ``schema.shape`` layout.
+        x = self.augment(x.view(-1, *self.shape))
+        x = x.to(self.learner.device, self.learner.x_dtype)
+        y = y.to(self.learner.device, self.learner.y_dtype)
+        self.learner.batch_train(x, y)
+
+    def batch_train(self, x: Tensor, y: Tensor) -> None:
+        """Add the batch to the coreset, then run ``repeats`` training steps on it."""
+        self.coreset.update(x, y)
+        for _ in range(self.repeats):
+            self.train_step(x, y)
+
+    @torch.no_grad()
+    def batch_predict_proba(self, x: Tensor) -> Tensor:
+        """Delegate prediction to the wrapped learner, without augmentation."""
+        x = x.to(self.learner.device, self.learner.x_dtype)
+        return self.learner.batch_predict_proba(x)
+
+    def on_test_task(self, task_id: int):
+        """Forward the test task id to the wrapped learner if it is task aware."""
+        if isinstance(self.learner, TestTaskAware):
+            self.learner.on_test_task(task_id)
+
+    def on_train_task(self, task_id: int):
+        """Forward the train task id to the wrapped learner if it is task aware."""
+        if isinstance(self.learner, TrainTaskAware):
+            self.learner.on_train_task(task_id)
diff --git a/tests/ocl/test_strategy.py b/tests/ocl/test_strategy.py
@@ -11,7 +11,7 @@
 from capymoa.classifier import Finetune, HoeffdingTree
 from capymoa.ocl.datasets import TinySplitMNIST
 from capymoa.ocl.evaluation import ocl_train_eval_loop
-from capymoa.ocl.strategy import ExperienceReplay, SLDA, NCM, GDumb
+from capymoa.ocl.strategy import ExperienceReplay, SLDA, NCM, GDumb, RAR
 from capymoa.stream import Schema
 
 import torch
@@ -46,6 +46,15 @@ def pre_processor() -> nn.Module:
     )
 
 
+def _new_rar(schema):
+    """Build the RAR learner exercised by the ``RAR`` entry in ``TEST_CASES``.
+
+    Wraps a perceptron-backed ``Finetune`` and augments with 20% dropout.
+    """
+    base_learner = Finetune(schema, Perceptron(schema))
+    return RAR(base_learner, augment=nn.Dropout(p=0.2), repeats=2)
+
+
 """
 Add new test cases here.
 
@@ -55,6 +64,7 @@ def pre_processor() -> nn.Module:
 TEST_CASES: List[Case] = [
     Case("HoeffdingTree", HoeffdingTree, Result(59.49, 42.59, 45.8), batch_size=1),
     Case("HoeffdingTree", HoeffdingTree, Result(59.00, 42.80, 42.5), batch_size=32),
+    Case("RAR", _new_rar, Result(41.50, 28.20, 8.20)),
     Case(
         "Finetune",
         partial(Finetune, model=Perceptron),
@@ -92,7 +102,12 @@ def test_ocl_classifier(case: Case):
     if os.environ.get("CI") == "true" and "SLDA" in case.name:
         pytest.skip("Skipping SLDA case on CI due to unreliable dataset download")
     scenario = TinySplitMNIST()
+
+    # Set random seeds for reproducibility
     torch.manual_seed(0)
+    np.random.seed(0)
+    torch.use_deterministic_algorithms(True)
+
     learner = case.constructor(scenario.schema)
     r = ocl_train_eval_loop(
         learner,