from typing import Optional, List, Dict, Any
import logging
import numpy as np
try:
import torch
from torch import Tensor, randn_like, random
from botorch.models import SingleTaskGP
from botorch.fit import fit_gpytorch_mll
from botorch.models.transforms import Warp
from botorch.sampling import SobolQMCNormalSampler
from botorch.utils.transforms import normalize
from botorch.utils.multi_objective.box_decompositions import (
NondominatedPartitioning,
)
from botorch.acquisition.multi_objective.monte_carlo import (
qExpectedHypervolumeImprovement,
)
from botorch.optim import optimize_acqf
from botorch.exceptions.errors import ModelFittingError
from gpytorch.mlls import ExactMarginalLogLikelihood
from linear_operator.utils.errors import NotPSDError
except ImportError as e:
logging.debug(e)
from syne_tune.optimizer.schedulers.searchers.searcher import BaseSearcher
from syne_tune.optimizer.schedulers.searchers.utils import (
make_hyperparameter_ranges,
)
logger = logging.getLogger(__name__)
NOISE_LEVEL = 1e-3  # std of the Gaussian jitter added to normalized objectives
MC_SAMPLES = 128  # number of quasi-MC samples used to estimate qEHVI
class ExpectedHyperVolumeImprovement(BaseSearcher):
"""
    Implementation of expected hypervolume improvement (EHVI) [1], based on the
    BoTorch implementation.
[1] S. Daulton, M. Balandat, and E. Bakshy.
Differentiable Expected Hypervolume Improvement for Parallel Multi-Objective
Bayesian Optimization.
Advances in Neural Information Processing Systems 33, 2020.
Additional arguments on top of parent class
    :class:`~syne_tune.optimizer.schedulers.searchers.searcher.BaseSearcher`:
    :param num_init_random: :meth:`suggest` returns randomly drawn
        configurations until at least ``num_init_random`` observations have
        been recorded in :meth:`on_trial_complete`. After that, the BoTorch
        algorithm is used. Defaults to 3
:param no_fantasizing: If ``True``, fantasizing is not done and pending
evaluations are ignored. This may lead to loss of diversity in
decisions. Defaults to ``False``
    :param max_num_observations: Maximum number of observations to use when
fitting the GP. If the number of observations gets larger than this
number, then data is subsampled. If ``None``, then all data is used to
fit the GP. Defaults to 200
:param input_warping: Whether to apply input warping when fitting the GP.
Defaults to ``True``
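
    A minimal usage sketch (illustrative; assumes ``syne_tune.config_space.uniform``
    is available and that both metrics are objectives to be minimized):

    .. code-block:: python

        from syne_tune.config_space import uniform

        searcher = ExpectedHyperVolumeImprovement(
            config_space={"x": uniform(0.0, 1.0)},
            random_seed=42,
        )
        config = searcher.suggest()
        # Report both objective values once the trial completes
        searcher.on_trial_complete(trial_id=0, config=config, metrics=[0.3, 0.7])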
"""
def __init__(
self,
config_space: Dict[str, Any],
points_to_evaluate: Optional[List[dict]] = None,
num_init_random: int = 3,
no_fantasizing: bool = False,
max_num_observations: Optional[int] = 200,
input_warping: bool = True,
        random_seed: Optional[int] = None,
):
        super().__init__(
config_space,
points_to_evaluate=points_to_evaluate,
random_seed=random_seed,
)
assert num_init_random >= 2
self.num_minimum_observations = num_init_random
        self.fantasizing = not no_fantasizing
self.max_num_observations = max_num_observations
self.input_warping = input_warping
self.trial_configs = dict()
self.pending_trials = set()
self.trial_observations = dict()
self._hp_ranges = make_hyperparameter_ranges(config_space)
# Set the random seed for botorch as well
random.manual_seed(self.random_seed)
self.random_state = np.random.RandomState(self.random_seed)
def on_trial_complete(
self, trial_id: int, config: Dict[str, Any], metrics: List[float]
):
self.trial_observations[trial_id] = metrics
if trial_id in self.pending_trials:
self.pending_trials.remove(trial_id)
def num_suggestions(self):
return len(self.trial_configs)
def suggest(self) -> Optional[dict]:
config_suggested = self._next_points_to_evaluate()
if config_suggested is None:
if self.objectives().shape[0] < self.num_minimum_observations:
config_suggested = self._get_random_config()
else:
config_suggested = self._sample_next_candidate()
if config_suggested is not None:
trial_id = len(self.trial_configs)
self.trial_configs[trial_id] = config_suggested
return config_suggested
def register_pending(
self,
trial_id: str,
config: Optional[dict] = None,
milestone: Optional[int] = None,
):
self.pending_trials.add(int(trial_id))
def evaluation_failed(self, trial_id: str):
self.cleanup_pending(trial_id)
def cleanup_pending(self, trial_id: str):
trial_id = int(trial_id)
if trial_id in self.pending_trials:
self.pending_trials.remove(trial_id)
def dataset_size(self):
return len(self.trial_observations)
    def _get_gp_bounds(self) -> Tensor:
        # Encoded search-space bounds as a ``2 x d`` tensor, the layout
        # expected by ``optimize_acqf``.
        return Tensor(self._hp_ranges.get_ndarray_bounds()).T
def _config_from_ndarray(self, candidate) -> dict:
return self._hp_ranges.from_ndarray(candidate)
def _get_random_config(self):
return {
k: v.sample() if hasattr(v, "sample") else v
for k, v in self.config_space.items()
}
def _sample_next_candidate(self) -> Optional[dict]:
"""
:return: A next candidate to evaluate, if possible it is obtained by
fitting a GP on past data and maximizing EI. If this fails because
of numerical difficulties with non PSD matrices, then the candidate
is sampled at random.
"""
try:
X = np.array(self._config_to_feature_matrix(self._configs_with_results()))
Y = Tensor(self.objectives())
# BoTorch only supports maximization
Y *= -1
if (
self.max_num_observations is not None
and len(X) >= self.max_num_observations
):
perm = self.random_state.permutation(len(X))[
: self.max_num_observations
]
X = X[perm]
Y = Y[perm]
subsample = True
else:
subsample = False
X_tensor = Tensor(X)
            # Normalize objectives to [0, 1]; a small Gaussian jitter is added
            # to avoid a degenerate, noise-free GP fit.
            bounds = torch.stack([Y.min(0).values, Y.max(0).values])
            noise_std = NOISE_LEVEL
            Y += noise_std * randn_like(Y)
            Y_tensor = normalize(Y, bounds=bounds)
gp = self._make_gp(X_tensor=X_tensor, Y_tensor=Y_tensor)
mll = ExactMarginalLogLikelihood(gp.likelihood, gp)
fit_gpytorch_mll(mll, max_attempts=1)
            if self.pending_trials and self.fantasizing and not subsample:
X_pending = self._config_to_feature_matrix(self._configs_pending())
else:
X_pending = None
sampler = SobolQMCNormalSampler(torch.Size([MC_SAMPLES]))
            # After negation and normalization, BoTorch maximizes objectives in
            # [0, 1]; the reference point must be dominated by all observed
            # points, so place it slightly below the origin.
            ref_point = torch.zeros(Y_tensor.shape[1]) - 0.1
            partitioning = NondominatedPartitioning(ref_point=ref_point, Y=Y_tensor)
            acq_func = qExpectedHypervolumeImprovement(
                model=gp,
                ref_point=ref_point,
                partitioning=partitioning,
                sampler=sampler,
                # Integrate over fantasized outcomes at pending points
                X_pending=X_pending,
            )
candidate, acq_value = optimize_acqf(
acq_func,
bounds=self._get_gp_bounds(),
q=1,
num_restarts=3,
raw_samples=100,
)
candidate = candidate.detach().numpy()[0]
return self._config_from_ndarray(candidate)
        except NotPSDError:
            logger.warning("Cholesky inversion failed, sampling randomly.")
            return self._get_random_config()
        except ModelFittingError:
            logger.warning("BoTorch was unable to fit the model, sampling randomly.")
            return self._get_random_config()
        except Exception:
            # BoTorch can raise many different errors; catching them broadly is
            # easier than enumerating them individually.
            logger.warning("BoTorch failed with an unexpected error, sampling randomly.")
            return self._get_random_config()
def _make_gp(self, X_tensor, Y_tensor):
        # Hard-coded toggle for fitting the GP in double precision
        double_precision = False
if double_precision:
X_tensor = X_tensor.double()
Y_tensor = Y_tensor.double()
        if self.input_warping:
            # Kumaraswamy input-warping transform over all input dimensions
            warp_tf = Warp(indices=list(range(X_tensor.shape[-1])))
else:
warp_tf = None
return SingleTaskGP(X_tensor, Y_tensor, input_transform=warp_tf)
def _config_to_feature_matrix(self, configs: List[dict]):
        bounds = self._get_gp_bounds()
X = Tensor(self._hp_ranges.to_ndarray_matrix(configs))
return normalize(X, bounds)
def objectives(self):
return np.array(list(self.trial_observations.values()))
def _configs_with_results(self) -> List[dict]:
return [
config
for trial, config in self.trial_configs.items()
            if trial not in self.pending_trials
]
def _configs_pending(self) -> List[dict]:
return [
config
for trial, config in self.trial_configs.items()
if trial in self.pending_trials
]
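
if __name__ == "__main__":
    # Minimal smoke-test sketch (illustrative only, not part of the original
    # module). Assumes ``syne_tune.config_space.uniform`` is available; both
    # toy metrics are treated as objectives to be minimized.
    from syne_tune.config_space import uniform

    config_space = {"x": uniform(0.0, 1.0), "y": uniform(0.0, 1.0)}
    searcher = ExpectedHyperVolumeImprovement(config_space, random_seed=0)
    for trial_id in range(10):
        config = searcher.suggest()
        # Toy objectives: squared distances to opposite corners of the unit
        # square, which trade off against each other.
        f1 = config["x"] ** 2 + (config["y"] - 1.0) ** 2
        f2 = (config["x"] - 1.0) ** 2 + config["y"] ** 2
        searcher.on_trial_complete(trial_id, config, metrics=[f1, f2])
        print(trial_id, config, [round(f1, 3), round(f2, 3)])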