facebookresearch · JasonKChow · Apr 29, 2025 · Apr 29, 2025 · Apr 29, 2025
diff --git a/aepsych/config.py b/aepsych/config.py
@@ -239,8 +239,16 @@ def update(
                     # Validate the parameter-specific block
                     self._check_param_settings(par_name)
 
-                    lb[i] = self[par_name].get("lower_bound", fallback="0")
-                    ub[i] = self[par_name].get("upper_bound", fallback="1")
+                    if self[par_name]["par_type"] == "categorical":
+                        raise NotImplementedError(
+                            "Categorical parameters not supported yet"
+                        )
+                        choices = self.getlist(par_name, "choices", element_type=str)
+                        lb[i] = "0"
+                        ub[i] = str(len(choices) - 1)
+                    else:
+                        lb[i] = self[par_name].get("lower_bound", fallback="0")
+                        ub[i] = self[par_name].get("upper_bound", fallback="1")
 
                 self["common"]["lb"] = f"[{', '.join(lb)}]"
                 self["common"]["ub"] = f"[{', '.join(ub)}]"
@@ -397,6 +405,12 @@ def _check_param_settings(self, param_name: str) -> None:
                     f"Parameter {param_name} is fixed and needs to have value set."
                 )
 
+        elif param_block["par_type"] == "categorical":
+            # Need a choices array
+            if "choices" not in param_block:
+                raise ValueError(
+                    f"Parameter {param_name} is missing the choices setting."
+                )
         else:
             raise ParameterConfigError(
                 f"Parameter {param_name} has an unsupported parameter type {param_block['par_type']}."

diff --git a/aepsych/models/inducing_points/__init__.py b/aepsych/models/inducing_points/__init__.py
@@ -8,12 +8,14 @@
 import sys
 
 from ...config import Config
+from .data import DataAllocator
 from .fixed import FixedAllocator, FixedPlusAllocator
 from .greedy_variance_reduction import GreedyVarianceReduction
 from .kmeans import KMeansAllocator
 from .sobol import SobolAllocator
 
 __all__ = [
+    "DataAllocator",
     "FixedAllocator",
     "FixedPlusAllocator",
     "GreedyVarianceReduction",

diff --git a/aepsych/models/inducing_points/base.py b/aepsych/models/inducing_points/base.py
@@ -13,6 +13,8 @@
 from aepsych.utils import get_dims
 from botorch.models.utils.inducing_point_allocators import InducingPointAllocator
 
+EMPTY_SIZE = torch.Size([])
+
 
 class BaseAllocator(InducingPointAllocator, ConfigurableMixin):
     """Base class for inducing point allocators."""
@@ -34,7 +36,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         """
         Abstract method for allocating inducing points. Must replace the

diff --git a/aepsych/models/inducing_points/data.py b/aepsych/models/inducing_points/data.py
@@ -0,0 +1,57 @@
+#!/usr/bin/env python3
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+import warnings
+
+import torch
+from aepsych.models.inducing_points.base import BaseAllocator, EMPTY_SIZE
+
+
+class DataAllocator(BaseAllocator):
+    def __init__(
+        self,
+        dim: int,
+    ) -> None:
+        """Initialize the DataAllocator. This allocator simply returns the input
+        data to use as the inducing points.
+
+        Args:
+            dim (int): Dimensionality of the search space.
+        """
+        super().__init__(dim=dim)
+
+    def allocate_inducing_points(
+        self,
+        inputs: torch.Tensor | None = None,
+        covar_module: torch.nn.Module | None = None,
+        num_inducing: int = 100,
+        input_batch_shape: torch.Size = EMPTY_SIZE,
+    ) -> torch.Tensor:
+        """Allocate inducing points by returning the inputs as the inducing points.
+
+        Args:
+            inputs (torch.Tensor): Input tensor, cloned and returned as inducing points.
+            covar_module (torch.nn.Module, optional): Kernel covariance module; included for API compatibility, but not used here.
+            num_inducing (int, optional): The number of inducing points to generate. This parameter is ignored by DataAllocator,
+                which always returns all input points.
+            input_batch_shape (torch.Size, optional): Batch shape; included for API compatibility, but not used here.
+
+        Returns:
+            torch.Tensor: The input data as inducing points.
+        """
+        if inputs is None:  # Dummy points
+            return self._allocate_dummy_points(num_inducing=num_inducing)
+
+        if num_inducing < inputs.shape[0]:
+            warnings.warn(
+                f"DataAllocator ignores num_inducing={num_inducing} and returns all input points.",
+                UserWarning,
+                stacklevel=2,
+            )
+
+        self.last_allocator_used = self.__class__
+        return inputs.clone().detach()
diff --git a/aepsych/models/inducing_points/fixed.py b/aepsych/models/inducing_points/fixed.py
@@ -8,7 +8,7 @@
 from typing import Any
 
 import torch
-from aepsych.models.inducing_points.base import BaseAllocator
+from aepsych.models.inducing_points.base import BaseAllocator, EMPTY_SIZE
 
 
 class FixedAllocator(BaseAllocator):
@@ -31,7 +31,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         """Allocate inducing points by returning the fixed inducing points.
 
@@ -93,7 +93,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         points = self.main_allocator.allocate_inducing_points(
             inputs=inputs,

diff --git a/aepsych/models/inducing_points/greedy_variance_reduction.py b/aepsych/models/inducing_points/greedy_variance_reduction.py
@@ -6,7 +6,7 @@
 # LICENSE file in the root directory of this source tree.
 
 import torch
-from aepsych.models.inducing_points.base import BaseAllocator
+from aepsych.models.inducing_points.base import BaseAllocator, EMPTY_SIZE
 from botorch.models.utils.inducing_point_allocators import (
     GreedyVarianceReduction as BaseGreedyVarianceReduction,
 )
@@ -18,7 +18,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         """Allocate inducing points using the GreedyVarianceReduction strategy. This is
         a thin wrapper around BoTorch's GreedyVarianceRedution inducing point allocator.

diff --git a/aepsych/models/inducing_points/kmeans.py b/aepsych/models/inducing_points/kmeans.py
@@ -6,7 +6,7 @@
 # LICENSE file in the root directory of this source tree.
 
 import torch
-from aepsych.models.inducing_points.base import BaseAllocator
+from aepsych.models.inducing_points.base import BaseAllocator, EMPTY_SIZE
 from scipy.cluster.vq import kmeans2
 
 
@@ -18,7 +18,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         """
         Generates `num_inducing` inducing points using k-means++ initialization on the input data.

diff --git a/aepsych/models/inducing_points/sobol.py b/aepsych/models/inducing_points/sobol.py
@@ -9,7 +9,7 @@
 
 import torch
 from aepsych.config import Config
-from aepsych.models.inducing_points.base import BaseAllocator
+from aepsych.models.inducing_points.base import BaseAllocator, EMPTY_SIZE
 from botorch.utils.sampling import draw_sobol_samples
 
 
@@ -36,7 +36,7 @@ def allocate_inducing_points(
         inputs: torch.Tensor | None = None,
         covar_module: torch.nn.Module | None = None,
         num_inducing: int = 100,
-        input_batch_shape: torch.Size = torch.Size([]),
+        input_batch_shape: torch.Size = EMPTY_SIZE,
     ) -> torch.Tensor:
         """
         Generates `num_inducing` inducing points within the specified bounds using Sobol sampling.

diff --git a/aepsych/transforms/ops/__init__.py b/aepsych/transforms/ops/__init__.py
@@ -5,9 +5,10 @@
 # This source code is licensed under the license found in the
 # LICENSE file in the root directory of this source tree.
 
+from .categorical import Categorical
 from .fixed import Fixed
 from .log10_plus import Log10Plus
 from .normalize_scale import NormalizeScale
 from .round import Round
 
-__all__ = ["Log10Plus", "NormalizeScale", "Round", "Fixed"]
+__all__ = ["Categorical", "Fixed", "Log10Plus", "NormalizeScale", "Round"]
diff --git a/aepsych/transforms/ops/categorical.py b/aepsych/transforms/ops/categorical.py
@@ -0,0 +1,97 @@
+#!/usr/bin/env python3
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+from typing import Any
+
+import torch
+from aepsych.config import Config
+from aepsych.transforms.ops.base import StringParameterMixin, Transform
+
+
+class Categorical(Transform, StringParameterMixin):
+    # These attributes do nothing here but ensures compat.
+    is_one_to_many = False
+    transform_on_train = True
+    transform_on_eval = True
+    transform_on_fantasize = True
+    training = True
+    reverse = False
+
+    def __init__(
+        self,
+        indices: list[int],
+        categories: dict[int, list[str]],
+    ) -> None:
+        """Initialize a categorical transform. The transform itself does not
+        change the tensors. Instead, this class allows passing in NumPy object
+        arrays where the categorical values are stored as strings. This provides
+        a convenient API to turn mixed categorical/continuous data into the
+        expected form for models.
+
+        Args:
+            indices (list[int]): The indices of the inputs that are categorical.
+            categories (dict[int, list[str]]): A dictionary mapping indices to
+                the list of categories for that input. There must be a list for
+                each index in `indices`.
+        """
+        self.indices = indices
+        self.categories = categories
+        self.string_map = self.categories
+
+    def _transform(self, X: torch.Tensor) -> torch.Tensor:
+        r"""This is a no-op as these transforms should be acting on indices
+        already.
+
+        Args:
+            X (torch.Tensor): A `batch_shape x n x d`-dim tensor of inputs.
+
+        Returns:
+            torch.Tensor: The input tensor.
+        """
+        return X
+
+    def _untransform(self, X: torch.Tensor) -> torch.Tensor:
+        r"""This is a no-op as these transforms should be acting on indices
+        already.
+
+        Args:
+            X (torch.Tensor): A `batch_shape x n x d`-dim tensor of transformed inputs.
+
+        Returns:
+            torch.Tensor: The input tensor.
+        """
+        return X
+
+    @classmethod
+    def get_config_options(
+        cls,
+        config: Config,
+        name: str | None = None,
+        options: dict[str, Any] | None = None,
+    ) -> dict[str, Any]:
+        """Return a dictionary of the relevant options to initialize a Fixed parameter
+        transform for the named parameter within the config.
+
+        Args:
+            config (Config): Config to look for options in.
+            name (str, optional): Parameter to find options for.
+            options (Dict[str, Any], optional): Options to override from the config.
+
+        Returns:
+            Dict[str, Any]: A dictionary of options to initialize this class with,
+                including the transformed bounds.
+        """
+        options = super().get_config_options(config=config, name=name, options=options)
+
+        if name is None:
+            raise ValueError(f"{name} must be set to initialize a transform.")
+
+        if "categories" not in options:
+            idx = options["indices"][0]  # There should only be one index
+            cat_dict = {idx: config.getlist(name, "categories", element_type=str)}
+            options["categories"] = cat_dict
+
+        return options
diff --git a/aepsych/transforms/parameters.py b/aepsych/transforms/parameters.py
@@ -16,7 +16,7 @@
 from aepsych.config import Config, ConfigurableMixin
 from aepsych.generators.base import AcqfGenerator, AEPsychGenerator
 from aepsych.models.base import AEPsychModelMixin
-from aepsych.transforms.ops import Fixed, Log10Plus, NormalizeScale, Round
+from aepsych.transforms.ops import Categorical, Fixed, Log10Plus, NormalizeScale, Round
 from aepsych.transforms.ops.base import Transform
 from aepsych.utils import get_bounds
 from botorch.acquisition import AcquisitionFunction
@@ -61,7 +61,7 @@ def __init__(
                     for key in transform.string_map.keys():
                         if key in fixed_string_map:
                             raise RuntimeError(
-                                "Conflicting string maps between the Fixed transforms, each parameter can only have a single string map."
+                                "Conflicting string maps between the string transforms, each parameter can only have a single string map."
                             )
 
                     fixed_string_map.update(transform.string_map)
@@ -145,8 +145,9 @@ def transform_bounds(
     ) -> torch.Tensor:
         r"""Transform bounds of a parameter.
 
-        Individual transforms are applied in sequence. Then an adjustment is applied to
-        ensure the bounds are correct.
+        Individual transforms are applied in sequence. Looks for a specific
+        transform_bounds method in each transform to apply that, otherwise uses the
+        normal transform.
 
         Args:
             X (torch.Tensor): A tensor of inputs. Either `[dim]` or `[2, dim]`.
@@ -255,14 +256,23 @@ def get_config_options(
                 )
                 transform_dict[f"{par}_Round"] = round
 
-            if par_type == "fixed":
+            elif par_type == "fixed":
                 fixed = Fixed.from_config(
                     config=config, name=par, options=transform_options
                 )
 
                 # We don't mess with bounds since we don't want to modify indices
                 transform_dict[f"{par}_Fixed"] = fixed
 
+            # Categorical variable
+            elif par_type == "categorical":
+                categorical = Categorical.from_config(
+                    config=config, name=par, options=transform_options
+                )
+
+                transform_dict[f"{par}_Categorical"] = categorical
+                continue  # Prevents log-scaling or normalizing
+
             # Log scale
             if config.getboolean(par, "log_scale", fallback=False):
                 log10 = Log10Plus.from_config(