Skip to content

Commit

Permalink
MultiObjective model and modelbridge
Browse files Browse the repository at this point in the history
Summary:
Large refactor to begin adding richer support for MultiObjective API and to support qNEHVI.

* Creates MultiObjectiveBotorchModel and MultiObjectiveTorchModelBridge and adds "ref_point" to those APIs, along with moving logic for handling random and Chebyshev scalarization methods.
* Declutter botorch_defaults by creating botorch_moo_defaults for multi-objective-specific methods.
* Update other APIs.

Pending (not necessarily this diff)
* Smarter "ref_point" inference.
* Move and add unit tests. (Scalarization partially tested in "test_botorch_models"; EHVI not tested.)
* qNEHVI
* Pareto frontier and hypervolume methods in Modelbridge

Reviewed By: sdaulton

Differential Revision: D22412876

fbshipit-source-id: 3d256dd3908408c214c00ca4be104d1d35552ecc
  • Loading branch information
2timesjay authored and facebook-github-bot committed Aug 25, 2020
1 parent 1ecee1b commit 272b6dd
Show file tree
Hide file tree
Showing 17 changed files with 1,550 additions and 331 deletions.
2 changes: 2 additions & 0 deletions ax/modelbridge/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,7 @@
get_thompson,
get_uniform,
)
from ax.modelbridge.multi_objective_torch import MultiObjectiveTorchModelBridge
from ax.modelbridge.numpy import NumpyModelBridge
from ax.modelbridge.torch import TorchModelBridge

Expand All @@ -24,6 +25,7 @@
"Models",
"NumpyModelBridge",
"TorchModelBridge",
"MultiObjectiveTorchModelBridge",
"get_factorial",
"get_GPEI",
"get_GPKG",
Expand Down
1 change: 1 addition & 0 deletions ax/modelbridge/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -653,6 +653,7 @@ def gen(
arms_by_signature=self._arms_by_signature,
)
best_arm = best_arms[0]

arms, candidate_metadata = gen_arms(
observation_features=observation_features,
arms_by_signature=self._arms_by_signature,
Expand Down
57 changes: 49 additions & 8 deletions ax/modelbridge/factory.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@
from ax.core.search_space import SearchSpace
from ax.core.types import TConfig
from ax.modelbridge.discrete import DiscreteModelBridge
from ax.modelbridge.multi_objective_torch import MultiObjectiveTorchModelBridge
from ax.modelbridge.random import RandomModelBridge
from ax.modelbridge.registry import (
Cont_X_trans,
Expand Down Expand Up @@ -363,14 +364,51 @@ def get_GPMES(
return checked_cast(TorchModelBridge, Models.GPMES(**inputs)) # pyre-ignore: [16]


def get_MOO_EHVI(
    experiment: Experiment,
    data: Data,
    ref_point: List[float],
    search_space: Optional[SearchSpace] = None,
    dtype: torch.dtype = torch.double,
    device: torch.device = (
        torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
    ),
) -> MultiObjectiveTorchModelBridge:
    """Instantiates a multi-objective model that generates points with EHVI.

    Requires a `ref_point`, a list of the baseline value for every objective being
    optimized. An arm only improves hypervolume if it is strictly better than this
    point in all metrics.

    Args:
        experiment: Experiment whose (multi-objective) optimization config and
            search space are used to configure the model.
        data: Observed data to fit the model on; must be non-empty.
        ref_point: Baseline value for each objective, in objective order.
        search_space: Optional override for the experiment's search space.
        dtype: Torch dtype for model tensors (double by default).
        device: Torch device; defaults to CUDA when available, else CPU.
            NOTE: the default is evaluated once at import time.

    Returns:
        A fitted ``MultiObjectiveTorchModelBridge``.

    Raises:
        ValueError: If the experiment has no optimization config, the objective
            is not a ``MultiObjective``, or ``data`` is empty.
    """
    # Fail fast with a clear error instead of the AttributeError that the
    # previously pyre-ignored `experiment.optimization_config.objective`
    # access would raise when no optimization config is attached.
    optimization_config = experiment.optimization_config
    if optimization_config is None:
        raise ValueError(
            "Multi-objective optimization requires an optimization config."
        )
    if not isinstance(optimization_config.objective, MultiObjective):
        raise ValueError("Multi-objective optimization requires multiple objectives.")
    if data.df.empty:  # pragma: no cover
        raise ValueError("MultiObjectiveOptimization requires non-empty data.")
    return checked_cast(
        MultiObjectiveTorchModelBridge,
        Models.MOO(
            experiment=experiment,
            data=data,
            ref_point=ref_point,
            search_space=search_space or experiment.search_space,
            torch_dtype=dtype,
            torch_device=device,
            # EHVI candidates are generated sequentially (greedy batch).
            default_model_gen_options={
                "acquisition_function_kwargs": {"sequential": True}
            },
        ),
    )


def get_MOO_PAREGO(
experiment: Experiment,
data: Data,
ref_point: Optional[List[float]] = None,
search_space: Optional[SearchSpace] = None,
dtype: torch.dtype = torch.double,
device: torch.device = DEFAULT_TORCH_DEVICE,
) -> TorchModelBridge:
) -> MultiObjectiveTorchModelBridge:
"""Instantiates a multi-objective model that generates points with ParEGO.
qParEGO optimizes random augmented chebyshev scalarizations of the multiple
Expand All @@ -382,14 +420,15 @@ def get_MOO_PAREGO(
if data.df.empty:
raise ValueError("MultiObjectiveOptimization requires non-empty data.")
return checked_cast(
TorchModelBridge,
Models.BOTORCH(
MultiObjectiveTorchModelBridge,
Models.MOO(
experiment=experiment,
data=data,
ref_point=ref_point,
search_space=search_space or experiment.search_space,
torch_dtype=dtype,
torch_device=device,
ref_point=None,
acqf_constructor=get_NEI,
default_model_gen_options={
"acquisition_function_kwargs": {
"chebyshev_scalarization": True,
Expand All @@ -407,8 +446,8 @@ def get_MOO_RS(
search_space: Optional[SearchSpace] = None,
dtype: torch.dtype = torch.double,
device: torch.device = DEFAULT_TORCH_DEVICE,
) -> TorchModelBridge:
"""Instantiates a Linear Random Scalarization multi-objective model.
) -> MultiObjectiveTorchModelBridge:
"""Instantiates a Random Scalarization multi-objective model.
Chooses a different random linear scalarization of the objectives
for generating each new candidate arm. This will only explore the
Expand All @@ -420,13 +459,15 @@ def get_MOO_RS(
if data.df.empty:
raise ValueError("MultiObjectiveOptimization requires non-empty data.")
return checked_cast(
TorchModelBridge,
Models.BOTORCH(
MultiObjectiveTorchModelBridge,
Models.MOO(
experiment=experiment,
data=data,
ref_point=ref_point,
search_space=search_space or experiment.search_space,
torch_dtype=dtype,
torch_device=device,
acqf_constructor=get_NEI,
default_model_gen_options={
"acquisition_function_kwargs": {
"random_scalarization": True,
Expand Down
245 changes: 245 additions & 0 deletions ax/modelbridge/multi_objective_torch.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,245 @@
#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from typing import Callable, Dict, List, Optional, Tuple, Type

import numpy as np
import torch
from ax.core.data import Data
from ax.core.experiment import Experiment
from ax.core.generator_run import GeneratorRun
from ax.core.multi_type_experiment import MultiTypeExperiment
from ax.core.observation import ObservationData, ObservationFeatures
from ax.core.optimization_config import OptimizationConfig
from ax.core.search_space import SearchSpace
from ax.core.types import TCandidateMetadata, TConfig, TGenMetadata
from ax.modelbridge.array import FIT_MODEL_ERROR
from ax.modelbridge.torch import TorchModelBridge
from ax.modelbridge.transforms.base import Transform
from ax.models.torch_base import TorchModel
from ax.utils.common.logger import get_logger
from torch import Tensor


# Module-level logger shared by this model bridge implementation.
logger = get_logger("MultiObjectiveTorchModelBridge")


class MultiObjectiveTorchModelBridge(TorchModelBridge):
    """A model bridge for using multi-objective torch-based models.

    Specifies an interface that is implemented by MultiObjectiveTorchModel. In
    particular, model should have methods fit, predict, and gen. See
    MultiObjectiveTorchModel for the API for each of these methods.

    Requires that all parameters have been transformed to RangeParameters
    or FixedParameters with float type and no log scale.

    This class converts Ax parameter types to torch tensors before passing
    them to the model.
    """

    # Reference point expressed in the transformed (model) space. Populated
    # lazily by `_transform_data` once fitted transforms are available; stays
    # None until then (or when no `ref_point` was supplied).
    _transformed_ref_point: Optional[List[float]]
    # Names of the objective metrics, in optimization-config order; used to
    # align the entries of `ref_point` with their metrics.
    _objective_metric_names: Optional[List[str]]

    def __init__(
        self,
        experiment: Experiment,
        search_space: SearchSpace,
        data: Data,
        model: TorchModel,
        transforms: List[Type[Transform]],
        transform_configs: Optional[Dict[str, TConfig]] = None,
        torch_dtype: Optional[torch.dtype] = None,  # noqa T484
        torch_device: Optional[torch.device] = None,
        status_quo_name: Optional[str] = None,
        status_quo_features: Optional[ObservationFeatures] = None,
        optimization_config: Optional[OptimizationConfig] = None,
        fit_out_of_design: bool = False,
        ref_point: Optional[List[float]] = None,
        default_model_gen_options: Optional[TConfig] = None,
    ) -> None:
        # Ref-point-based algorithms are explicitly unsupported for
        # MultiTypeExperiments; reject that combination up front.
        if isinstance(experiment, MultiTypeExperiment) and ref_point is not None:
            raise NotImplementedError(
                "Ref-point dependent multi-objective optimization algorithms "
                "like EHVI are not yet supported for MultiTypeExperiments. "
                "Remove the reference point arg and use a compatible algorithm "
                "like ParEGO."
            )
        self.ref_point = ref_point
        self._transformed_ref_point = None
        self._objective_metric_names = None
        # Cache objective metric names before the superclass __init__ runs,
        # since `_transform_data` (invoked during fitting) reads them.
        oc = optimization_config or experiment.optimization_config
        if oc:
            self._objective_metric_names = [m.name for m in oc.objective.metrics]
        super().__init__(
            experiment=experiment,
            search_space=search_space,
            data=data,
            model=model,
            transforms=transforms,
            transform_configs=transform_configs,
            torch_dtype=torch_dtype,
            torch_device=torch_device,
            status_quo_name=status_quo_name,
            status_quo_features=status_quo_features,
            optimization_config=optimization_config,
            fit_out_of_design=fit_out_of_design,
            default_model_gen_options=default_model_gen_options,
        )

    def _model_gen(
        self,
        n: int,
        bounds: List[Tuple[float, float]],
        objective_weights: np.ndarray,
        outcome_constraints: Optional[Tuple[np.ndarray, np.ndarray]],
        linear_constraints: Optional[Tuple[np.ndarray, np.ndarray]],
        fixed_features: Optional[Dict[int, float]],
        pending_observations: Optional[List[np.ndarray]],
        model_gen_options: Optional[TConfig],
        rounding_func: Callable[[np.ndarray], np.ndarray],
        target_fidelities: Optional[Dict[int, float]],
    ) -> Tuple[np.ndarray, np.ndarray, TGenMetadata, List[TCandidateMetadata]]:
        """Generate candidates from the underlying torch model.

        Mirrors the superclass generation path, but additionally forwards a
        `ref_point` (preferring the transformed one when available) to the
        model's `gen` call. Returns numpy arrays of candidate points and
        weights plus generation/candidate metadata.
        """
        if not self.model:  # pragma: no cover
            raise ValueError(FIT_MODEL_ERROR.format(action="_model_gen"))
        obj_w, oc_c, l_c, pend_obs = self._validate_and_convert_to_tensors(
            objective_weights=objective_weights,
            outcome_constraints=outcome_constraints,
            linear_constraints=linear_constraints,
            pending_observations=pending_observations,
        )
        # Prefer the ref point in transformed (model) space; fall back to the
        # raw user-supplied one with a warning, since mixing spaces may skew
        # hypervolume-based acquisition.
        ref_point = None
        if self._transformed_ref_point:
            ref_point = self._transformed_ref_point
        elif self.ref_point:
            # Assign ref point if available.
            logger.warning(
                "No attribute _transformed_ref_point. Using untransformed ref_point."
            )
            ref_point = self.ref_point
        tensor_rounding_func = self._array_callable_to_tensor_callable(rounding_func)
        # Per-call options override the bridge-level defaults.
        augmented_model_gen_options = {
            **self._default_model_gen_options,
            **(model_gen_options or {}),
        }
        # pyre-fixme[16]: `Optional` has no attribute `gen`.
        X, w, gen_metadata, candidate_metadata = self.model.gen(
            n=n,
            bounds=bounds,
            objective_weights=obj_w,
            outcome_constraints=oc_c,
            linear_constraints=l_c,
            fixed_features=fixed_features,
            pending_observations=pend_obs,
            model_gen_options=augmented_model_gen_options,
            rounding_func=tensor_rounding_func,
            target_fidelities=target_fidelities,
            ref_point=ref_point,
        )
        # Detach/copy to CPU numpy so callers never hold references into the
        # model's device tensors.
        return (
            X.detach().cpu().clone().numpy(),
            w.detach().cpu().clone().numpy(),
            gen_metadata,
            candidate_metadata,
        )

    def _transform_data(
        self,
        obs_feats: List[ObservationFeatures],
        obs_data: List[ObservationData],
        search_space: SearchSpace,
        transforms: Optional[List[Type[Transform]]],
        transform_configs: Optional[Dict[str, TConfig]],
    ) -> Tuple[List[ObservationFeatures], List[ObservationData], SearchSpace]:
        """Initialize transforms and apply them to provided data.

        In addition to the superclass behavior, pushes the user-supplied
        `ref_point` through the now-fitted transforms and caches the result in
        `self._transformed_ref_point` for use during generation.
        """
        # Run superclass version to fit transforms to observations
        obs_feats, obs_data, search_space = super()._transform_data(
            obs_feats=obs_feats,
            obs_data=obs_data,
            search_space=search_space,
            transforms=transforms,
            transform_configs=transform_configs,
        )

        ref_point = self.ref_point
        metric_names = list(self._metric_names or [])
        objective_metric_names = list(self._objective_metric_names or [])
        if ref_point and metric_names and objective_metric_names:
            num_metrics = len(metric_names)
            # Map each objective metric to its ref-point value; assumes
            # `ref_point` is ordered to match `objective_metric_names`.
            ref_dict = dict(zip(objective_metric_names, ref_point))
            if obs_data:
                # Create synthetic ObservationData representing the reference point.
                # Pad with non-objective outcomes from existing data.
                # Should always have existing data with BO.
                sample_obs_data = obs_data[0]
                padded_ref_dict: Dict[str, float] = dict(
                    zip(sample_obs_data.metric_names, sample_obs_data.means)
                )
                padded_ref_dict.update(ref_dict)
                # NOTE(review): covariance is sized by the total metric count
                # (`num_metrics`), which presumably equals the number of keys
                # in `padded_ref_dict` — confirm they cannot diverge when an
                # observation lacks some metrics.
                ref_obs_data = [
                    ObservationData(
                        metric_names=list(padded_ref_dict.keys()),
                        means=np.array(list(padded_ref_dict.values())),
                        covariance=np.zeros((num_metrics, num_metrics)),
                    )
                ]
                ref_obs_feats = []

                # Apply initialized transforms to reference point.
                for t in self.transforms.values():
                    ref_obs_data = t.transform_observation_data(
                        ref_obs_data, ref_obs_feats
                    )
                transformed_ref_obsd = ref_obs_data.pop()
                transformed_ref_dict = dict(
                    zip(transformed_ref_obsd.metric_names, transformed_ref_obsd.means)
                )
                # Re-extract only the objective metrics, preserving order.
                self._transformed_ref_point = []
                for objective_metric_name in objective_metric_names:
                    # pyre-fixme[16]
                    self._transformed_ref_point.append(
                        transformed_ref_dict[objective_metric_name]
                    )
            else:
                # No previous data means transform can't have been fit.
                pass
        return obs_feats, obs_data, search_space

    def gen(
        self,
        n: int,
        search_space: Optional[SearchSpace] = None,
        optimization_config: Optional[OptimizationConfig] = None,
        pending_observations: Optional[Dict[str, List[ObservationFeatures]]] = None,
        fixed_features: Optional[ObservationFeatures] = None,
        model_gen_options: Optional[TConfig] = None,
    ) -> GeneratorRun:
        """Generate `n` new candidate arms.

        Identical to the superclass `gen`, except that a per-call
        `optimization_config` refreshes the cached objective metric names so
        ref-point alignment stays correct.
        """
        if optimization_config:
            # Update objective metric names if new optimization config is present.
            self._objective_metric_names = [
                m.name for m in optimization_config.objective.metrics
            ]
        return super().gen(
            n=n,
            search_space=search_space,
            optimization_config=optimization_config,
            pending_observations=pending_observations,
            fixed_features=fixed_features,
            model_gen_options=model_gen_options,
        )

    # TODO: Complete these stubs based on https://fb.quip.com/fUMRATIeahCy
    def pareto_frontier(self, X: Tensor) -> Tensor:
        raise NotImplementedError()

    def observed_pareto_frontier(self) -> Tensor:
        raise NotImplementedError()

    def hypervolume(self, X: Tensor) -> Tensor:
        raise NotImplementedError()

    def observed_hypervolume(self) -> Tensor:
        raise NotImplementedError()
Loading

0 comments on commit 272b6dd

Please sign in to comment.