Implement Chebyshev center fallback for center node (#4477)

mgarrard · facebook-github-bot · commit c62f3fdf064b · 2026-01-09T10:52:44.000-08:00
Summary:

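This diff implements a Chebyshev-center fallback for the center node: if the naive center violates the parameter constraints, the center of the largest ball inscribed in the feasible region is used instead.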

Reviewed By: sdaulton

Differential Revision: D85712042
diff --git a/ax/core/search_space.py b/ax/core/search_space.py
@@ -8,11 +8,15 @@
 
 from __future__ import annotations
 
+import math
+
 import warnings
 from collections.abc import Mapping, Sequence
 from dataclasses import dataclass, field
 from logging import Logger
 
+import numpy as np
+
 import pandas as pd
 from ax import core
 from ax.core.arm import Arm
@@ -36,6 +40,9 @@
 from ax.utils.common.constants import Keys
 from ax.utils.common.logger import get_logger
 from pyre_extensions import none_throws
+from scipy.optimize import linprog
+
+from scipy.special import expit, logit
 
 
 logger: Logger = get_logger(__name__)
@@ -572,6 +579,134 @@ def clone(self) -> SearchSpace:
             parameter_constraints=[pc.clone() for pc in self._parameter_constraints],
         )
 
+    def compute_naive_center(self) -> TParameterization:
+        """Compute the naive center of the search space.
+
+        For range parameters, the center is the midpoint of the range. If the
+        parameter is log-scale, then the center point will correspond to the
+        mid-point in log-scale. If the parameter is logit-scale, then the center
+        point will correspond to the mid-point in logit-scale.
+        For choice parameters, the center point is determined as the value
+        that is at the middle of the values list.
+        For both choice and integer range parameters, ties are broken in
+        favor of the larger value / index. For example, a binary parameter with
+        values [0, 1] will be sampled as 1.
+        Fixed parameters are returned at their only allowed value.
+
+        Returns:
+            A parameterization with the center values for each parameter.
+        """
+        parameters = {}
+        derived_params = []  # computed last, from the other parameters' values
+        for name, p in self.parameters.items():
+            if isinstance(p, RangeParameter):
+                if p.logit_scale:  # midpoint in logit space, mapped back via expit
+                    center = expit((logit(p.lower) + logit(p.upper)) / 2.0)
+                elif p.log_scale:  # midpoint in log10 space, mapped back via 10**
+                    center = 10 ** ((math.log10(p.lower) + math.log10(p.upper)) / 2.0)
+                else:  # plain arithmetic midpoint of the bounds
+                    center = (float(p.lower) + float(p.upper)) / 2.0
+                parameters[name] = p.cast(center)
+            elif isinstance(p, ChoiceParameter):  # middle index; ties -> larger index
+                parameters[name] = p.values[int(len(p.values) / 2)]
+            elif isinstance(p, FixedParameter):
+                parameters[name] = p.value
+            elif isinstance(p, DerivedParameter):
+                derived_params.append(p)  # deferred until the loop has finished
+            else:
+                raise NotImplementedError(f"Parameter type {type(p)} is not supported.")
+        for p in derived_params:  # evaluated on the parameterization built so far
+            parameters[p.name] = p.compute(parameters=parameters)
+        if self.is_hierarchical:  # presumably drops inapplicable parameters — confirm
+            parameters = self._cast_parameterization(parameters=parameters)
+        return parameters
+
+    def compute_chebyshev_center(self) -> dict[str, float] | None:
+        """Compute the Chebyshev center of the constraint polytope.
+
+        The Chebyshev center is the center of the largest inscribed ball in the
+        feasible region defined by the parameter constraints. This is computed
+        by solving a linear program. It is most limited by the tightest constraint.
+
+        For a polytope defined by a @ x <= b, the Chebyshev center (x_c, r) is
+        the solution to:
+            maximize r, where r is the radius of the inscribed ball
+            subject to: a_i^T x + r ||a_i||_2 <= b_i for all i
+
+        Note: this only considers natural (non-log, non-logit) range parameters.
+        Other parameter types are handled naively via compute_naive_center.
+
+        Returns:
+            A dictionary mapping parameter names to values at the Chebyshev center,
+            or None if the problem is infeasible.
+        """
+        # Only non-log, non-logit range parameters become LP variables
+        natural_range_params = {
+            name: param
+            for name, param in self.range_parameters.items()
+            if not param.log_scale and not param.logit_scale
+        }
+
+        if not natural_range_params:
+            return {}  # no LP variables; distinct from None (solver failure)
+
+        constraint_matrix = []
+        bound_vector = []
+        param_names = list(natural_range_params.keys())
+        num_params = len(natural_range_params)
+        param_name_to_idx = {name: idx for idx, name in enumerate(param_names)}
+
+        # One row per parameter constraint: sum_j weight_j * x_j <= bound
+        for constraint in self.parameter_constraints:
+            row = np.zeros(num_params)
+            for param_name, weight in constraint.constraint_dict.items():
+                if param_name in param_name_to_idx:  # other params are left out
+                    row[param_name_to_idx[param_name]] = weight
+
+            constraint_matrix.append(row)  # NOTE(review): may be all zeros — ok?
+            bound_vector.append(constraint.bound)
+
+        # Add the box bounds as two inequality rows per parameter
+        for name, idx in param_name_to_idx.items():
+            param = natural_range_params[name]
+            # lower bound: -x_i <= -lower_i
+            row_lower = np.zeros(num_params)
+            row_lower[idx] = -1.0
+            constraint_matrix.append(row_lower)
+            bound_vector.append(-float(param.lower))
+
+            # upper bound: x_i <= upper_i
+            row_upper = np.zeros(num_params)
+            row_upper[idx] = 1.0
+            constraint_matrix.append(row_upper)
+            bound_vector.append(float(param.upper))
+
+        constraint_matrix = np.array(constraint_matrix)
+        bound_vector = np.array(bound_vector)
+
+        # Euclidean norm of each row; it is the coefficient of r in that row
+        row_norms = np.linalg.norm(constraint_matrix, axis=1)
+        augmented_constraint_matrix = np.column_stack([constraint_matrix, row_norms])
+
+        # Set objective vector which maximizes r (minimize -r == maximize r)
+        radius_objective_vector = np.zeros(num_params + 1)
+        radius_objective_vector[-1] = -1.0  # r is the last LP variable
+        result = linprog(
+            c=radius_objective_vector,
+            A_ub=augmented_constraint_matrix,
+            b_ub=bound_vector,
+            bounds=[(None, None)] * num_params + [(0, None)],  # no bounds except r >= 0
+        )
+
+        if not result.success or result.x is None:
+            return None  # the solver did not report a usable solution
+
+        center_values = result.x[:num_params]  # drop the trailing r
+        center_dict = {
+            name: float(center_values[param_name_to_idx[name]]) for name in param_names
+        }
+        return center_dict
+
     def _validate_parameter_constraints(
         self, parameter_constraints: list[ParameterConstraint]
     ) -> None:
diff --git a/ax/generation_strategy/center_generation_node.py b/ax/generation_strategy/center_generation_node.py
@@ -6,7 +6,6 @@
 
 # pyre-strict
 
-import math
 from dataclasses import dataclass
 from typing import Any
 
@@ -16,13 +15,8 @@
 from ax.core.experiment import Experiment
 from ax.core.generator_run import GeneratorRun
 from ax.core.observation import ObservationFeatures
-from ax.core.parameter import (
-    ChoiceParameter,
-    DerivedParameter,
-    FixedParameter,
-    RangeParameter,
-)
-from ax.core.search_space import SearchSpace
+from ax.core.parameter import DerivedParameter
+from ax.core.search_space import HierarchicalSearchSpace, SearchSpace
 from ax.core.types import TParameterization
 from ax.exceptions.generation_strategy import AxGenerationException
 from ax.generation_strategy.external_generation_node import ExternalGenerationNode
@@ -31,7 +25,6 @@
     AutoTransitionAfterGenOrExhaustion,
 )
 from pyre_extensions import none_throws
-from scipy.special import expit, logit
 
 
 @dataclass(init=False)
@@ -88,17 +81,16 @@ def gen(
         """
         # Check if center already exists or is infeasible
         self.search_space = experiment.search_space
-        center_params = self._compute_center_params()
-        search_space = none_throws(self.search_space)
+        center_params = self.compute_center_params()
 
-        # Check if center already exists in experiment
-        center_arm = Arm(parameters=center_params)
-        if center_arm.signature in experiment.arms_by_signature:
+        # Check if unable to find a suitable center
+        if center_params is None:
             self._should_skip = True
             return None
 
-        # Check if center violates parameter constraints
-        if not search_space.check_membership(parameterization=center_params):
+        # Check if center already exists in experiment
+        center_arm = Arm(parameters=center_params)
+        if center_arm.signature in experiment.arms_by_signature:
             self._should_skip = True
             return None
 
@@ -112,33 +104,43 @@ def gen(
             **gs_gen_kwargs,
         )
 
-    def _compute_center_params(self) -> TParameterization:
-        """Compute the center of the search space."""
+    def compute_center_params(self) -> TParameterization | None:
+        """Compute the center of the search space.
+
+        Returns:
+            The center parameters, or None if the center cannot be computed
+            (e.g., due to infeasible constraints).
+        """
         search_space = none_throws(self.search_space)
-        parameters = {}
-        derived_params = []
-        for name, p in search_space.parameters.items():
-            if isinstance(p, RangeParameter):
-                if p.logit_scale:
-                    # Leverage scipy's numerically stable logit and expit functions
-                    center = expit((logit(p.lower) + logit(p.upper)) / 2.0)
-                elif p.log_scale:
-                    center = 10 ** ((math.log10(p.lower) + math.log10(p.upper)) / 2.0)
-                else:
-                    center = (float(p.lower) + float(p.upper)) / 2.0
-                parameters[name] = p.cast(center)
-            elif isinstance(p, ChoiceParameter):
-                parameters[name] = p.values[int(len(p.values) / 2)]
-            elif isinstance(p, FixedParameter):
-                parameters[name] = p.value
-            elif isinstance(p, DerivedParameter):
-                derived_params.append(p)
-            else:
-                raise NotImplementedError(f"Parameter type {type(p)} is not supported.")
-        for p in derived_params:
-            parameters[p.name] = p.compute(parameters=parameters)
-        if search_space.is_hierarchical:
-            parameters = search_space._cast_parameterization(parameters=parameters)
+        parameters = search_space.compute_naive_center()
+
+        # Check for search space membership, which will check if the generated
+        # point satisfies the parameter constraints. Fallback to Chebyshev center
+        if not search_space.check_membership(parameterization=parameters):
+            chebyshev_center = search_space.compute_chebyshev_center()
+            if chebyshev_center is not None:
+                for name, value in chebyshev_center.items():
+                    if name in parameters:
+                        parameters[name] = search_space[name].cast(value)
+
+            # recompute derived parameters using the updated parameter values
+            derived_params = [
+                p
+                for p in search_space.parameters.values()
+                if isinstance(p, DerivedParameter)
+            ]
+            for p in derived_params:
+                parameters[p.name] = p.compute(parameters=parameters)
+
+            if isinstance(search_space, HierarchicalSearchSpace):
+                parameters = search_space._cast_parameterization(parameters=parameters)
+
+            # Return None if something goes wrong, or some non-range parameter
+            # remains out of search space
+            if chebyshev_center is None or not search_space.check_membership(
+                parameterization=parameters
+            ):
+                return None
         return parameters
 
     def get_next_candidate(
@@ -156,18 +158,18 @@ def get_next_candidate(
         favor of the larger value / index. For example, a binary parameter with
         values [0, 1] will be sampled as 1.
         Fixed parameters are returned at their only allowed value.
-        """
-        search_space = none_throws(self.search_space)
-        parameters = self._compute_center_params()
 
-        # Check for search space membership, which will check if the generated
-        # point satisfies the parameter constraints.
-        if not search_space.check_membership(parameterization=parameters):
-            # TODO: Improve this handling by instead choosing the point
-            # in the center of the feasible set (e.g. by finding the)
-            # Chebyshev center of the constraint polytope.
+        Note: If the naive midpoint violates the parameter constraints, we attempt
+        to compute the Chebyshev center of the constraint polytope defined by the
+        bounds and parameter constraints of the non-log, non-logit range parameters.
+        This finds the center of the largest inscribed ball in the feasible region.
+        """
+        center_params = self.compute_center_params()
+        if center_params is None:
+            # Raising an exception here causes a fallback to Sobol. In practice,
+            # this case should be very unlikely to be hit.
             raise AxGenerationException(
-                "Center of the search space does not satisfy parameter constraints. "
-                "The generation strategy will fallback to Sobol. "
+                "Center of the search space does not satisfy parameter "
+                "constraints. The generation strategy will fallback to Sobol. "
             )
-        return parameters
+        return center_params
diff --git a/ax/generation_strategy/tests/test_center_generation_node.py b/ax/generation_strategy/tests/test_center_generation_node.py