From 5e9bf72c8cc517194a668ceb26cb853da3511bef Mon Sep 17 00:00:00 2001
From: Elizabeth Santorella <santorella@meta.com>
Date: Wed, 23 Oct 2024 13:28:14 -0700
Subject: [PATCH] Move noise_std, constraint_noise_std, and negate from
 `ParamBasedTestProblem` to `SyntheticProblemRunner` (#2926)

Summary:

Context: Noise and negation are (somewhat surprisingly!) handled by the runner, even though similar attributes exist on BoTorch test problems. This is confusing; it is better to _require_ these to be set on the runner and to raise an exception if they are set on the test problem.

Also, a `ParamBasedTestProblem` should be as minimal as possible, since it is the only benchmark class that needs to be repeatedly subclassed.

Furthermore, this makes the code easier to work with by moving these arguments to a shallower level in the stack, making them easier to access and reducing the need to pass dicts of parameters.

This PR:
* Adds `noise_std`, `constraint_noise_std`, and `negate` to `SyntheticProblemRunner`
* Removes those arguments from `ParamBasedTestProblem` and all its subclasses
* Updates references
* Adds an exception if those arguments are present when creating a runner based on a BoTorch problem

Reviewed By: Balandat

Differential Revision: D64575398
---
 ax/benchmark/benchmark_problem.py             | 13 +++++++
 .../problems/synthetic/hss/jenatton.py        |  4 +-
 ax/benchmark/runners/botorch_test.py          | 30 +++++++++++----
 ax/benchmark/tests/methods/test_methods.py    |  4 +-
 .../problems/synthetic/hss/test_jenatton.py   |  8 +---
 .../runners/test_botorch_test_problem.py      | 37 +++++++++++++++----
 ax/benchmark/tests/test_benchmark.py          |  3 +-
 ax/benchmark/tests/test_benchmark_problem.py  | 14 +++----
 ax/utils/testing/benchmark_stubs.py           |  2 +
 9 files changed, 80 insertions(+), 35 deletions(-)

diff --git a/ax/benchmark/benchmark_problem.py b/ax/benchmark/benchmark_problem.py
index 720f0a6332b..971becca18c 100644
--- a/ax/benchmark/benchmark_problem.py
+++ b/ax/benchmark/benchmark_problem.py
@@ -298,6 +298,9 @@ def create_problem_from_botorch(
     *,
     test_problem_class: type[BaseTestProblem],
     test_problem_kwargs: dict[str, Any],
+    noise_std: float | list[float] | None = None,
+    constraint_noise_std: float | list[float] | None = None,
+    negate: bool = False,
     num_trials: int,
     lower_is_better: bool = True,
     observe_noise_sd: bool = False,
@@ -316,6 +319,13 @@ def create_problem_from_botorch(
             to define the `search_space`, `optimization_config`, and `runner`.
         test_problem_kwargs: Keyword arguments used to instantiate the
             `test_problem_class`.
+        noise_std: Standard deviation of synthetic noise added to objectives. If
+            `None`, no noise is added. If a float, the same noise level is used
+            for all objectives.
+        constraint_noise_std: Standard deviation of synthetic noise added to
+            constraints.
+        negate: Whether the values produced by the test function should be
+            negated. Does not apply to constraints.
         lower_is_better: Whether this is a minimization problem. For MOO, this
             applies to all objectives.
         num_trials: Simply the `num_trials` of the `BenchmarkProblem` created.
@@ -382,6 +392,9 @@ def create_problem_from_botorch(
                 search_space=search_space,
                 param_names=list(search_space.parameters.keys()),
             ),
+            noise_std=noise_std,
+            negate=negate,
+            constraint_noise_std=constraint_noise_std,
         ),
         num_trials=num_trials,
         observe_noise_stds=observe_noise_sd,
diff --git a/ax/benchmark/problems/synthetic/hss/jenatton.py b/ax/benchmark/problems/synthetic/hss/jenatton.py
index 1e87e3de9df..3c80b0c6091 100644
--- a/ax/benchmark/problems/synthetic/hss/jenatton.py
+++ b/ax/benchmark/problems/synthetic/hss/jenatton.py
@@ -55,8 +55,6 @@ def jenatton_test_function(
 class Jenatton(ParamBasedTestProblem):
     """Jenatton test function for hierarchical search spaces."""
 
-    noise_std: float | None = None
-    negate: bool = False
     num_objectives: int = 1
 
     # pyre-fixme[14]: Inconsistent override
@@ -125,7 +123,7 @@ def get_jenatton_benchmark_problem(
         search_space=search_space,
         optimization_config=optimization_config,
         runner=ParamBasedTestProblemRunner(
-            test_problem=Jenatton(noise_std=noise_std), outcome_names=[name]
+            test_problem=Jenatton(), outcome_names=[name], noise_std=noise_std
         ),
         num_trials=num_trials,
         observe_noise_stds=observe_noise_sd,
diff --git a/ax/benchmark/runners/botorch_test.py b/ax/benchmark/runners/botorch_test.py
index 802f154923e..afd4a522ca0 100644
--- a/ax/benchmark/runners/botorch_test.py
+++ b/ax/benchmark/runners/botorch_test.py
@@ -28,9 +28,6 @@ class ParamBasedTestProblem(ABC):
     """
 
     num_objectives: int
-    constraint_noise_std: float | list[float] | None = None
-    noise_std: float | list[float] | None = None
-    negate: bool = False
 
     @abstractmethod
     def evaluate_true(self, params: Mapping[str, TParamValue]) -> Tensor:
@@ -74,19 +71,22 @@ class SyntheticProblemRunner(BenchmarkRunner, ABC):
 
     test_problem: BaseTestProblem | ParamBasedTestProblem
     modified_bounds: list[tuple[float, float]] | None = None
+    constraint_noise_std: float | list[float] | None = None
+    noise_std: float | list[float] | None = None
+    negate: bool = False
 
     @property
     def _is_constrained(self) -> bool:
         return isinstance(self.test_problem, ConstrainedBaseTestProblem)
 
     def get_noise_stds(self) -> None | float | dict[str, float]:
-        noise_std = self.test_problem.noise_std
+        noise_std = self.noise_std
         noise_std_dict: dict[str, float] = {}
         num_obj = self.test_problem.num_objectives
 
         # populate any noise_stds for constraints
         if self._is_constrained:
-            constraint_noise_std = self.test_problem.constraint_noise_std
+            constraint_noise_std = self.constraint_noise_std
             if isinstance(constraint_noise_std, list):
                 for i, cns in enumerate(constraint_noise_std, start=num_obj):
                     if cns is not None:
@@ -141,6 +141,22 @@ class BotorchTestProblemRunner(SyntheticProblemRunner):
 
     def __post_init__(self, search_space_digest: SearchSpaceDigest | None) -> None:
         super().__post_init__(search_space_digest=search_space_digest)
+        if self.test_problem.noise_std is not None:
+            raise ValueError(
+                "noise_std should be set on the runner, not the test problem."
+            )
+        if (
+            hasattr(self.test_problem, "constraint_noise_std")
+            and self.test_problem.constraint_noise_std is not None
+        ):
+            raise ValueError(
+                "constraint_noise_std should be set on the runner, not the test "
+                "problem."
+            )
+        if self.test_problem.negate:
+            raise ValueError(
+                "negate should be set on the runner, not the test problem."
+            )
         self.test_problem = self.test_problem.to(dtype=torch.double)
 
     def get_Y_true(self, params: Mapping[str, TParamValue]) -> Tensor:
@@ -174,7 +190,7 @@ def get_Y_true(self, params: Mapping[str, TParamValue]) -> Tensor:
 
         Y_true = self.test_problem.evaluate_true(X).view(-1)
         # `BaseTestProblem.evaluate_true()` does not negate the outcome
-        if self.test_problem.negate:
+        if self.negate:
             Y_true = -Y_true
 
         if self._is_constrained:
@@ -228,6 +244,6 @@ def get_Y_true(self, params: Mapping[str, TParamValue]) -> Tensor:
         """
         Y_true = self.test_problem.evaluate_true(params).view(-1)
         # `ParamBasedTestProblem.evaluate_true()` does not negate the outcome
-        if self.test_problem.negate:
+        if self.negate:
             Y_true = -Y_true
         return Y_true
diff --git a/ax/benchmark/tests/methods/test_methods.py b/ax/benchmark/tests/methods/test_methods.py
index 63d974e53b4..cdf54f95126 100644
--- a/ax/benchmark/tests/methods/test_methods.py
+++ b/ax/benchmark/tests/methods/test_methods.py
@@ -138,9 +138,7 @@ def test_sobol(self) -> None:
     def _test_get_best_parameters(
         self, use_model_predictions: bool, as_batch: bool
     ) -> None:
-        problem = get_problem(
-            problem_key="ackley4", num_trials=2, test_problem_kwargs={"noise_std": 1.0}
-        )
+        problem = get_problem(problem_key="ackley4", num_trials=2, noise_std=1.0)
 
         method = get_sobol_botorch_modular_acquisition(
             model_cls=SingleTaskGP,
diff --git a/ax/benchmark/tests/problems/synthetic/hss/test_jenatton.py b/ax/benchmark/tests/problems/synthetic/hss/test_jenatton.py
index 2ef8e71eed9..953ea7be3aa 100644
--- a/ax/benchmark/tests/problems/synthetic/hss/test_jenatton.py
+++ b/ax/benchmark/tests/problems/synthetic/hss/test_jenatton.py
@@ -107,9 +107,7 @@ def test_create_problem(self) -> None:
         self.assertTrue(objective.minimize)
         self.assertTrue(metric.lower_is_better)
         self.assertEqual(
-            assert_is_instance(
-                problem.runner, ParamBasedTestProblemRunner
-            ).test_problem.noise_std,
+            assert_is_instance(problem.runner, ParamBasedTestProblemRunner).noise_std,
             0.0,
         )
         self.assertFalse(assert_is_instance(metric, BenchmarkMetric).observe_noise_sd)
@@ -121,9 +119,7 @@ def test_create_problem(self) -> None:
         metric = objective.metric
         self.assertTrue(metric.lower_is_better)
         self.assertEqual(
-            assert_is_instance(
-                problem.runner, ParamBasedTestProblemRunner
-            ).test_problem.noise_std,
+            assert_is_instance(problem.runner, ParamBasedTestProblemRunner).noise_std,
             0.1,
         )
         self.assertTrue(assert_is_instance(metric, BenchmarkMetric).observe_noise_sd)
diff --git a/ax/benchmark/tests/runners/test_botorch_test_problem.py b/ax/benchmark/tests/runners/test_botorch_test_problem.py
index 7edfac3015b..77e11fe42d5 100644
--- a/ax/benchmark/tests/runners/test_botorch_test_problem.py
+++ b/ax/benchmark/tests/runners/test_botorch_test_problem.py
@@ -31,11 +31,35 @@
 
 
 class TestSyntheticRunner(TestCase):
+    def test_runner_raises_for_botorch_attrs(self) -> None:
+        with self.assertRaisesRegex(
+            ValueError, "noise_std should be set on the runner, not the test problem."
+        ):
+            BotorchTestProblemRunner(
+                test_problem=Hartmann(dim=6, noise_std=0.1),
+                outcome_names=["objective"],
+            )
+        with self.assertRaisesRegex(
+            ValueError,
+            "constraint_noise_std should be set on the runner, not the test problem.",
+        ):
+            BotorchTestProblemRunner(
+                test_problem=ConstrainedHartmann(dim=6, constraint_noise_std=0.1),
+                outcome_names=["objective", "constraint"],
+            )
+        with self.assertRaisesRegex(
+            ValueError, "negate should be set on the runner, not the test problem."
+        ):
+            BotorchTestProblemRunner(
+                test_problem=Hartmann(dim=6, negate=True),
+                outcome_names=["objective"],
+            )
+
     def test_synthetic_runner(self) -> None:
         botorch_cases = [
             (
                 BotorchTestProblemRunner,
-                test_problem_class(dim=6, noise_std=noise_std),
+                test_problem_class(dim=6),
                 modified_bounds,
                 noise_std,
             )
@@ -48,9 +72,7 @@ def test_synthetic_runner(self) -> None:
         param_based_cases = [
             (
                 ParamBasedTestProblemRunner,
-                TestParamBasedTestProblem(
-                    num_objectives=num_objectives, dim=6, noise_std=noise_std
-                ),
+                TestParamBasedTestProblem(num_objectives=num_objectives, dim=6),
                 None,
                 noise_std,
             )
@@ -76,6 +98,7 @@ def test_synthetic_runner(self) -> None:
                 test_problem=test_problem,
                 outcome_names=outcome_names,
                 modified_bounds=modified_bounds,
+                noise_std=noise_std,
             )
 
             test_description: str = (
@@ -168,9 +191,9 @@ def test_synthetic_runner(self) -> None:
 
     def test_botorch_test_problem_runner_heterogeneous_noise(self) -> None:
         runner = BotorchTestProblemRunner(
-            test_problem=ConstrainedHartmann(
-                dim=6, noise_std=0.1, constraint_noise_std=0.05
-            ),
+            test_problem=ConstrainedHartmann(dim=6),
+            noise_std=0.1,
+            constraint_noise_std=0.05,
             outcome_names=["objective", "constraint"],
         )
         self.assertDictEqual(
diff --git a/ax/benchmark/tests/test_benchmark.py b/ax/benchmark/tests/test_benchmark.py
index e90aec58f1f..fed952aef17 100644
--- a/ax/benchmark/tests/test_benchmark.py
+++ b/ax/benchmark/tests/test_benchmark.py
@@ -202,12 +202,11 @@ def _test_replication_with_inference_value(
             num_sobol_trials=3,
         )
 
-        test_problem_kwargs = {"noise_std": 100.0}
         num_trials = 4
         problem = get_single_objective_benchmark_problem(
-            test_problem_kwargs=test_problem_kwargs,
             num_trials=num_trials,
             report_inference_value_as_trace=report_inference_value_as_trace,
+            noise_std=100.0,
         )
         res = benchmark_replication(problem=problem, method=method, seed=seed)
         # The inference trace could coincide with the oracle trace, but it won't
diff --git a/ax/benchmark/tests/test_benchmark_problem.py b/ax/benchmark/tests/test_benchmark_problem.py
index 388f4c87c77..f9818f8cae1 100644
--- a/ax/benchmark/tests/test_benchmark_problem.py
+++ b/ax/benchmark/tests/test_benchmark_problem.py
@@ -204,19 +204,18 @@ def _test_constrained_from_botorch(
     ) -> None:
         ax_problem = create_problem_from_botorch(
             test_problem_class=test_problem_class,
-            test_problem_kwargs={
-                "noise_std": objective_noise_std,
-                "constraint_noise_std": constraint_noise_std,
-            },
+            test_problem_kwargs={},
             lower_is_better=True,
             num_trials=1,
             observe_noise_sd=observe_noise_sd,
+            noise_std=objective_noise_std,
+            constraint_noise_std=constraint_noise_std,
         )
         runner = checked_cast(BotorchTestProblemRunner, ax_problem.runner)
         self.assertTrue(runner._is_constrained)
         botorch_problem = checked_cast(ConstrainedBaseTestProblem, runner.test_problem)
-        self.assertEqual(botorch_problem.noise_std, objective_noise_std)
-        self.assertEqual(botorch_problem.constraint_noise_std, constraint_noise_std)
+        self.assertEqual(runner.noise_std, objective_noise_std)
+        self.assertEqual(runner.constraint_noise_std, constraint_noise_std)
         opt_config = ax_problem.optimization_config
         outcome_constraints = opt_config.outcome_constraints
         self.assertEqual(
@@ -376,8 +375,9 @@ def test_get_oracle_experiment_from_params(self) -> None:
     def test_get_oracle_experiment_from_experiment(self) -> None:
         problem = create_problem_from_botorch(
             test_problem_class=Branin,
-            test_problem_kwargs={"negate": True},
+            test_problem_kwargs={},
             num_trials=5,
+            negate=True,
         )
 
         # empty experiment
diff --git a/ax/utils/testing/benchmark_stubs.py b/ax/utils/testing/benchmark_stubs.py
index 2c58ede49e6..0bf7d49c4dd 100644
--- a/ax/utils/testing/benchmark_stubs.py
+++ b/ax/utils/testing/benchmark_stubs.py
@@ -48,6 +48,7 @@ def get_single_objective_benchmark_problem(
     num_trials: int = 4,
     test_problem_kwargs: dict[str, Any] | None = None,
     report_inference_value_as_trace: bool = False,
+    noise_std: float | list[float] | None = None,
 ) -> BenchmarkProblem:
     return create_problem_from_botorch(
         test_problem_class=Branin,
@@ -55,6 +56,7 @@ def get_single_objective_benchmark_problem(
         num_trials=num_trials,
         observe_noise_sd=observe_noise_sd,
         report_inference_value_as_trace=report_inference_value_as_trace,
+        noise_std=noise_std,
     )