open-edge-platform · alexriedel1 · Jun 7, 2026 · Jun 8, 2026 · Jun 8, 2026 · Jun 8, 2026
@@ -43,6 +43,7 @@
     - Reverse Distillation (:class:`anomalib.models.image.ReverseDistillation`)
     - STFPM (:class:`anomalib.models.image.Stfpm`)
     - SuperSimpleNet (:class:`anomalib.models.image.Supersimplenet`)
+    - SuperADD (:class:`anomalib.models.image.SuperADD`)
     - UFlow (:class:`anomalib.models.image.Uflow`)
     - UniNet (:class:`anomalib.models.image.UniNet`)
     - VLM-AD (:class:`anomalib.models.image.VlmAd`)
@@ -87,6 +88,7 @@
     Patchflow,
     ReverseDistillation,
     Stfpm,
+    SuperADD,
     Supersimplenet,
     Uflow,
     UniNet,
@@ -135,7 +137,9 @@ class UnknownModelError(ModuleNotFoundError):
     "Patchflow",
     "ReverseDistillation",
     "Stfpm",
+    "SuperADD",
     "Supersimplenet",
+    "SuperADD",
     "Uflow",
     "UniNet",
     "VlmAd",

@@ -45,6 +45,7 @@
     - :class:`Patchflow`: Patch Flow
     - :class:`ReverseDistillation`: Reverse Knowledge Distillation
     - :class:`Stfpm`: Student-Teacher Feature Pyramid Matching
+    - :class:`SuperADD`: Supervised Anomaly Detection with Additive Feature Fusion
     - :class:`SuperSimpleNet`: SuperSimpleNet
     - :class:`Uflow`: Unsupervised Flow
     - :class:`UniNet`: Student-Teacher Contrastive Learning Model
@@ -76,6 +77,7 @@
 from .patchflow import Patchflow
 from .reverse_distillation import ReverseDistillation
 from .stfpm import Stfpm
+from .super_add import SuperADD
 from .supersimplenet import Supersimplenet
 from .uflow import Uflow
 from .uninet import UniNet
@@ -108,6 +110,7 @@
     "ReverseDistillation",
     "Stfpm",
     "Supersimplenet",
+    "SuperADD",
     "Uflow",
     "UniNet",
     "VlmAd",

@@ -0,0 +1,32 @@
+# Copyright (C) 2022-2025 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+"""SuperADD: PatchCore-style anomaly detection on a DINOv3 backbone.
+
+SuperADD is an anomaly detection model that builds a memory bank of patch
+features extracted from a pretrained DINOv3 Vision Transformer. Multi-layer ViT
+token features are computed over overlapping image patches, a per-layer memory
+bank is built from normal training images via distance-based coreset
+subsampling, and test images are scored by nearest-neighbor distance to the
+bank.
+
+Example:
+    >>> from anomalib.data import MVTecAD
+    >>> from anomalib.models import SuperADD
+    >>> from anomalib.engine import Engine
+
+    >>> # Initialize model and data
+    >>> datamodule = MVTecAD()
+    >>> model = SuperADD()
+
+    >>> # Train using the Engine
+    >>> engine = Engine()
+    >>> engine.fit(model=model, datamodule=datamodule)
+
+    >>> # Get predictions
+    >>> predictions = engine.predict(model=model, datamodule=datamodule)
+"""
+
+from .lightning_model import SuperADD
+
+__all__ = ["SuperADD"]
@@ -0,0 +1,292 @@
+# Copyright (C) 2022-2025 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+"""SuperADD: PatchCore-style anomaly detection on a DINOv3 backbone.
+
+This module provides the Lightning implementation of the SuperADD model. SuperADD
+extracts multi-layer Vision Transformer token features from a pretrained DINOv3
+backbone over overlapping image patches, builds a per-layer memory bank from
+normal training images using distance-based coreset subsampling, and detects
+anomalies by nearest-neighbor search against this memory bank.
+
+Example:
+    >>> from anomalib.data import MVTecAD
+    >>> from anomalib.models import SuperADD
+    >>> from anomalib.engine import Engine
+
+    >>> # Initialize model and data
+    >>> datamodule = MVTecAD()
+    >>> model = SuperADD()
+
+    >>> # Train using the Engine
+    >>> engine = Engine()
+    >>> engine.fit(model=model, datamodule=datamodule)
+
+    >>> # Get predictions
+    >>> predictions = engine.predict(model=model, datamodule=datamodule)
+
+See Also:
+    - :class:`anomalib.models.image.super_add.torch_model.SuperADDModel`:
+        PyTorch implementation of the SuperADD model architecture
+"""
+
+import logging
+from typing import Any
+
+import torch
+from lightning.pytorch.utilities.types import STEP_OUTPUT
+from torch import nn
+from torchvision.transforms.v2 import CenterCrop, Compose, Normalize, Resize
+
+from anomalib import LearningType, PrecisionType
+from anomalib.data import Batch
+from anomalib.metrics import Evaluator
+from anomalib.models.components import AnomalibModule, MemoryBankMixin
+from anomalib.post_processing import PostProcessor
+from anomalib.pre_processing import PreProcessor
+from anomalib.visualization import Visualizer
+
+from .torch_model import SuperADDModel
+
+logger = logging.getLogger(__name__)
+
+
+class SuperADD(MemoryBankMixin, AnomalibModule):
+    """SuperADD Lightning Module for anomaly detection.
+
+    This class implements the SuperADD algorithm, which uses a memory bank of
+    patch features for anomaly detection. Multi-layer token features are
+    extracted from a pretrained DINOv3 Vision Transformer over overlapping image
+    patches and stored in a per-layer memory bank. Anomalies are detected by
+    comparing test image patches against the stored features using nearest
+    neighbor search.
+
+    The model works in two phases:
+    1. Training: Extract and store patch features from normal training images,
+       then build a coreset memory bank.
+    2. Inference: Compare test image patches against the stored features to
+       detect anomalies.
+
+    Args:
+        backbone (str): Name of the timm DINOv3 backbone used for feature
+            extraction. Defaults to ``"vit_huge_plus_patch16_dinov3"``.
+        patch_size (int): Side length (in pixels) of the overlapping patches the
+            input image is split into before being passed to the backbone.
+            Defaults to ``448``.
+        patch_overlap (int): Overlap (in pixels) between neighboring patches.
+            Defaults to ``16``.
+        precision (str | PrecisionType, optional): Precision type for model
+            computations. Can be either a string (``"float32"``, ``"float16"``)
+            or a :class:`PrecisionType` enum value.
+            Defaults to ``PrecisionType.FLOAT32``.
+        pre_processor (nn.Module | bool, optional): Pre-processor instance or
+            bool flag. Defaults to ``True``.
+        post_processor (nn.Module | bool, optional): Post-processor instance or
+            bool flag. Defaults to ``True``.
+        evaluator (Evaluator | bool, optional): Evaluator instance or bool flag.
+            Defaults to ``True``.
+        visualizer (Visualizer | bool, optional): Visualizer instance or bool
+            flag. Defaults to ``True``.
+
+    Raises:
+        ValueError: If an unsupported ``precision`` value is provided.
+
+    Example:
+        >>> from anomalib.data import MVTecAD
+        >>> from anomalib.models import SuperADD
+        >>> from anomalib.engine import Engine
+
+        >>> datamodule = MVTecAD()
+        >>> model = SuperADD()
+
+        >>> engine = Engine()
+        >>> engine.fit(model=model, datamodule=datamodule)
+        >>> predictions = engine.predict(model=model, datamodule=datamodule)
+
+    See Also:
+        - :class:`anomalib.models.image.super_add.torch_model.SuperADDModel`:
+            PyTorch implementation of the SuperADD model
+        - :class:`anomalib.models.components.AnomalibModule`:
+            Base class for all anomaly detection models
+        - :class:`anomalib.models.components.MemoryBankMixin`:
+            Mixin class for models using feature memory banks
+    """
+
+    def __init__(
+        self,
+        backbone: str = "vit_huge_plus_patch16_dinov3",
+        patch_size: int = 448,
+        patch_overlap: int = 16,
+        precision: str | PrecisionType = PrecisionType.FLOAT32,
+        pre_processor: nn.Module | bool = True,
+        post_processor: nn.Module | bool = True,
+        evaluator: Evaluator | bool = True,
+        visualizer: Visualizer | bool = True,
+    ) -> None:
+        super().__init__(
+            pre_processor=pre_processor,
+            post_processor=post_processor,
+            evaluator=evaluator,
+            visualizer=visualizer,
+        )
+
+        self.model: SuperADDModel = SuperADDModel(
+            backbone=backbone,
+            patch_size=patch_size,
+            patch_overlap=patch_overlap,
+        )
+
+        if isinstance(precision, str):
+            precision = PrecisionType(precision.lower())
+
+        if precision == PrecisionType.FLOAT16:
+            self.model = self.model.bfloat16()
+        elif precision == PrecisionType.FLOAT32:
+            self.model = self.model.float()
+        else:
+            msg = f"""Unsupported precision type: {precision}.
+            Supported types are: {PrecisionType.FLOAT16}, {PrecisionType.FLOAT32}."""
+            raise ValueError(msg)
+
+    @classmethod
+    def configure_pre_processor(
+        cls,
+        image_size: tuple[int, int] | None = None,
+        center_crop_size: tuple[int, int] | None = None,
+    ) -> PreProcessor:
+        """Configure the default pre-processor for SuperADD.
+
+        If valid center_crop_size is provided, the pre-processor will
+        also perform center cropping, according to the paper.
+
+        Args:
+            image_size (tuple[int, int] | None, optional): Target size for
+                resizing. Defaults to ``(256, 256)``.
+            center_crop_size (tuple[int, int] | None, optional): Size for center
+                cropping. Defaults to ``None``.
+
+        Returns:
+            PreProcessor: Configured pre-processor instance.
+
+        Raises:
+            ValueError: If at least one dimension of ``center_crop_size`` is larger
+                than correspondent ``image_size`` dimension.
+
+        Example:
+            >>> pre_processor = SuperADD.configure_pre_processor(
+            ...     image_size=(256, 256)
+            ... )
+            >>> transformed_image = pre_processor(image)
+        """
+        image_size = image_size or (448, 448)
+
+        if center_crop_size is not None:
+            if center_crop_size[0] > image_size[0] or center_crop_size[1] > image_size[1]:
+                msg = f"Center crop size {center_crop_size} cannot be larger than image size {image_size}."
+                raise ValueError(msg)
+            transform = Compose([
+                Resize(image_size, antialias=True),
+                CenterCrop(center_crop_size),
+                Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
+            ])
+        else:
+            transform = Compose([
+                Resize(image_size, antialias=True),
+                Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
+            ])
+
+        return PreProcessor(transform=transform)
+
+    @staticmethod
+    def configure_optimizers() -> None:
+        """Configure optimizers.
+
+        Returns:
+            None: SuperADD requires no optimization.
+        """
+        return
+
+    def training_step(self, batch: Batch, *args, **kwargs) -> None:
+        """Generate feature embedding of the batch.
+
+        Args:
+            batch (Batch): Input batch containing image and metadata
+            *args: Additional arguments (unused)
+            **kwargs: Additional keyword arguments (unused)
+
+        Returns:
+            torch.Tensor: Dummy loss tensor for Lightning compatibility
+
+        Note:
+            The method stores embeddings in ``self.embeddings`` for later use in
+            ``fit()``.
+        """
+        del args, kwargs  # These variables are not used.
+        _ = self.model(batch.image)
+        # Return a dummy loss tensor
+        return torch.tensor(0.0, requires_grad=True, device=self.device)
+
+    def fit(self) -> None:
+        """Apply subsampling to the embedding collected from the training set.
+
+        This method:
+        1. Applies coreset subsampling to reduce memory requirements
+        """
+        logger.info("Applying core-set subsampling to get the embedding.")
+        self.model.subsample_embedding()
+
+    def validation_step(self, batch: Batch, *args, **kwargs) -> STEP_OUTPUT:
+        """Generate predictions for a batch of images.
+
+        Args:
+            batch (Batch): Input batch containing images and metadata
+            *args: Additional arguments (unused)
+            **kwargs: Additional keyword arguments (unused)
+
+        Returns:
+            STEP_OUTPUT: Batch with added predictions
+
+        Note:
+            Predictions include anomaly maps and scores computed using nearest
+            neighbor search.
+        """
+        # These variables are not used.
+        del args, kwargs
+
+        # Get anomaly maps and predicted scores from the model.
+        predictions = self.model(batch.image)
+
+        return batch.update(**predictions._asdict())
+
+    @property
+    def trainer_arguments(self) -> dict[str, Any]:
+        """Get default trainer arguments for SuperADD.
+
+        Returns:
+            dict[str, Any]: Trainer arguments
+                - ``gradient_clip_val``: ``0`` (no gradient clipping needed)
+                - ``max_epochs``: ``1`` (single pass through training data)
+                - ``num_sanity_val_steps``: ``0`` (skip validation sanity checks)
+                - ``devices``: ``1`` (only single gpu supported)
+        """
+        return {"gradient_clip_val": 0, "max_epochs": 1, "num_sanity_val_steps": 0, "devices": 1}
+
+    @property
+    def learning_type(self) -> LearningType:
+        """Get the learning type.
+
+        Returns:
+            LearningType: Always ``LearningType.ONE_CLASS`` as SuperADD only
+                trains on normal samples
+        """
+        return LearningType.ONE_CLASS
+
+    @staticmethod
+    def configure_post_processor() -> PostProcessor:
+        """Configure the default post-processor.
+
+        Returns:
+            PostProcessor: Post-processor for one-class models that
+                converts raw scores to anomaly predictions
+        """
+        return PostProcessor()