diff --git a/package/samplers/hebo/sampler.py b/package/samplers/hebo/sampler.py index b76cd5bf..e9d61123 100644 --- a/package/samplers/hebo/sampler.py +++ b/package/samplers/hebo/sampler.py @@ -1,13 +1,19 @@ from __future__ import annotations from collections.abc import Sequence +from typing import Any +import warnings import numpy as np +import optuna from optuna.distributions import BaseDistribution from optuna.distributions import CategoricalDistribution from optuna.distributions import FloatDistribution from optuna.distributions import IntDistribution +from optuna.samplers import BaseSampler +from optuna.search_space import IntersectionSearchSpace from optuna.study import Study +from optuna.study._study_direction import StudyDirection from optuna.trial import FrozenTrial from optuna.trial import TrialState import optunahub @@ -18,11 +24,70 @@ class HEBOSampler(optunahub.samplers.SimpleBaseSampler): - def __init__(self, search_space: dict[str, BaseDistribution]) -> None: - super().__init__(search_space) - self._hebo = HEBO(self._convert_to_hebo_design_space(search_space)) + """A sampler using `HEBO __` as the backend. - def sample_relative( + For further information about HEBO algorithm, please refer to the following papers: + - `Cowen-Rivers, Alexander I., et al. An Empirical Study of Assumptions in Bayesian Optimisation. arXiv preprint arXiv:2012.03826 (2021).__` + + Args: + search_space: + A search space required for Define-and-Run manner. Default is :obj:`None`. + + seed: + A seed for ``HEBOSampler``. Default is :obj:`None`. + + constant_liar: + If :obj:`True`, penalize running trials to avoid suggesting parameter configurations + nearby. Default is :obj:`False`. + + .. note:: + Abnormally terminated trials often leave behind a record with a state of + ``RUNNING`` in the storage. + Such "zombie" trial parameters will be avoided by the constant liar algorithm + during subsequent sampling. + When using an :class:`~optuna.storages.RDBStorage`, it is possible to enable the + ``heartbeat_interval`` to change the records for abnormally terminated trials to + ``FAIL``. + (This note is quoted from `TPESampler __`.) + + .. note:: + It is recommended to set this value to :obj:`True` during distributed + optimization to avoid having multiple workers evaluating similar parameter + configurations. In particular, if each objective function evaluation is costly + and the durations of the running states are significant, and/or the number of + workers is high. + (This note is quoted from `TPESampler __`.) + + .. note:: + HEBO algorithm involves multi-objective optimization of multiple acquisition functions. + While `constant_liar` is a simple way to get diverse params for parallel optimization, + it may not be the best approach for HEBO. + + independent_sampler: + A :class:`~optuna.samplers.BaseSampler` instance that is used for independent + sampling. The parameters not contained in the relative search space are sampled + by this sampler. If :obj:`None` is specified, :class:`~optuna.samplers.RandomSampler` + is used as the default. + """ # NOQA + def __init__(self, + search_space: dict[str, BaseDistribution] | None = None, + seed: int | None = None, + constant_liar: bool = False, + independent_sampler: BaseSampler | None = None, + ) -> None: + super().__init__(search_space, seed) + if search_space is not None and constant_liar is False: + self._hebo = HEBO(self._convert_to_hebo_design_space(search_space), scramble_seed=seed) + else: + self._hebo = None + self._intersection_search_space = IntersectionSearchSpace() + self._independent_sampler = ( + independent_sampler or optuna.samplers.RandomSampler(seed=seed) + ) + self._is_independent_sampler_specified = independent_sampler is not None + self._constant_liar = constant_liar + + def _sample_relative_define_and_run( self, study: Study, trial: FrozenTrial, search_space: dict[str, BaseDistribution] ) -> dict[str, float]: params_pd = self._hebo.suggest() @@ -32,6 +97,72 @@ def sample_relative( params[name] = params_pd[name].to_numpy()[0] return params + def _sample_relative_stateless( + self, study: Study, trial: FrozenTrial, search_space: dict[str, BaseDistribution] + ) -> dict[str, float]: + if self._constant_liar: + target_states = [TrialState.COMPLETE, TrialState.RUNNING] + else: + target_states = [TrialState.COMPLETE] + + trials = study.get_trials(deepcopy=False, states=target_states) + if len([t for t in trials if t.state == TrialState.COMPLETE]) < 1: + # note: The backend HEBO implementation use Sobol sampling here. + # This sampler does not call `hebo.suggest()` here because + # Optuna needs to know search space by running the first trial in Define-by-Run. + return {} + + # Assume that the back-end HEBO implementation aims to minimize. + if study.direction == StudyDirection.MINIMIZE: + worst_values = max( + [t.values for t in trials if t.state == TrialState.COMPLETE] + ) + else: + worst_values = min( + [t.values for t in trials if t.state == TrialState.COMPLETE] + ) + sign = 1 if study.direction == StudyDirection.MINIMIZE else -1 + + hebo = HEBO( + self._convert_to_hebo_design_space(search_space), scramble_seed=self._seed + ) + for t in trials: + if t.state == TrialState.COMPLETE: + hebo_params = {name: t.params[name] for name in search_space.keys()} + hebo.observe( + pd.DataFrame([hebo_params]), + np.asarray([x * sign for x in t.values]), + ) + elif t.state == TrialState.RUNNING: + try: + hebo_params = {name: t.params[name] for name in search_space.keys()} + except: # NOQA + # There are one or more params which are not suggested yet. + continue + # If `constant_liar == True`, assume that the RUNNING params result in bad values, + # thus preventing the simultaneous suggestion of (almost) the same params + # during parallel execution. + hebo.observe(pd.DataFrame([hebo_params]), np.asarray([worst_values])) + else: + assert False + params_pd = hebo.suggest() + params = {} + for name in search_space.keys(): + params[name] = params_pd[name].to_numpy()[0] + return params + + def sample_relative( + self, study: Study, trial: FrozenTrial, search_space: dict[str, BaseDistribution] + ) -> dict[str, float]: + if study._is_multi_objective(): + raise ValueError( + "This function does not support multi-objective optimization study." + ) + if self._hebo is None or self._constant_liar is True: + return self._sample_relative_stateless(study, trial, search_space) + else: + return self._sample_relative_define_and_run(study, trial, search_space) + def after_trial( self, study: Study, @@ -39,7 +170,11 @@ def after_trial( state: TrialState, values: Sequence[float] | None, ) -> None: - self._hebo.observe(pd.DataFrame([trial.params]), np.asarray([values])) + if self._hebo is not None: + # Assume that the back-end HEBO implementation aims to minimize. + if study.direction == StudyDirection.MAXIMIZE: + values = [-x for x in values] + self._hebo.observe(pd.DataFrame([trial.params]), np.asarray([values])) def _convert_to_hebo_design_space( self, search_space: dict[str, BaseDistribution] @@ -103,3 +238,26 @@ def _convert_to_hebo_design_space( else: raise NotImplementedError(f"Unsupported distribution: {distribution}") return DesignSpace().parse(design_space) + + def infer_relative_search_space( + self, study: Study, trial: FrozenTrial + ) -> dict[str, BaseDistribution]: + return optuna.search_space.intersection_search_space( + study._get_trials(deepcopy=False, use_cache=True) + ) + + def sample_independent( + self, + study: Study, + trial: FrozenTrial, + param_name: str, + param_distribution: BaseDistribution, + ) -> Any: + if not self._is_independent_sampler_specified: + warnings.warn( + "`HEBOSampler` falls back to `RandomSampler` due to dynamic search space. Is this intended?" + ) + + return self._independent_sampler.sample_independent( + study, trial, param_name, param_distribution + )