# Source code for deepobs.tuner.bayesian

# -*- coding: utf-8 -*-
import os

import bayes_opt
from bayes_opt import UtilityFunction

from .bayesian_utils import (
    _init_summary_directory,
    _save_bo_optimizer_object,
    _update_bo_tuning_summary,
)
from .tuner import Tuner
from .tuner_utils import rerun_setting


class GP(Tuner):
    """A Bayesian optimization tuner that uses a Gaussian Process surrogate."""

    def __init__(
        self,
        optimizer_class,
        hyperparam_names,
        bounds,
        ressources,
        runner,
        transformations=None,
    ):
        """
        Args:
            optimizer_class (framework optimizer class): The optimizer to tune.
            hyperparam_names (dict): Nested dictionary that holds the name, type
                and default values of the hyperparameters.
            bounds (dict): A dict where the key is the hyperparameter name and
                the value is a tuple of its bounds.
            ressources (int): The number of total evaluations of the tuning
                process.
            runner: The DeepOBS runner which is used for each evaluation.
            transformations (dict): A dict where the key is the hyperparameter
                name and the value is a callable that returns the transformed
                hyperparameter.
        """
        super(GP, self).__init__(
            optimizer_class, hyperparam_names, ressources, runner
        )
        self._bounds = bounds
        self._transformations = transformations

    @staticmethod
    def _determine_cost_from_output_and_mode(output, mode):
        """Extract the scalar cost of one run from the runner output.

        Uses the test accuracy when available, otherwise the negated test
        loss, because ``bayes_opt`` maximizes the objective.

        Args:
            output (dict): Runner output; must contain ``test_accuracies``
                or ``test_losses``.
            mode (str): ``final`` for the last epoch's value, ``best`` for
                the best value over all epochs.

        Returns:
            float: The cost of the run (higher is better).

        Raises:
            NotImplementedError: If ``mode`` is neither ``final`` nor ``best``.
        """
        # Check if accuracy is available, else take the loss.
        if "test_accuracies" not in output:
            # -1 because bayes_opt looks for maximum of cost function
            cost = [-1 * v for v in output["test_losses"]]
        else:
            cost = output["test_accuracies"]

        if mode == "final":
            cost = cost[-1]
        elif mode == "best":
            cost = max(cost)
        else:
            raise NotImplementedError(
                """Mode not available for this tuning method. Please use final or best."""
            )
        return cost

    def _generate_cost_function(self, testproblem, output_dir, mode, **kwargs):
        """Build the objective function that ``bayes_opt`` evaluates.

        Args:
            testproblem (str): The test problem to run each evaluation on.
            output_dir (str): Directory the runner writes its results to.
            mode (str): Cost mode, ``final`` or ``best``.
            **kwargs: Forwarded to ``runner.run``.

        Returns:
            callable: Maps hyperparameters (as keyword arguments) to the
            scalar cost of one training run.
        """

        def _cost_function(**hyperparams):
            # Apply transformations if they exist.
            if self._transformations is not None:
                for hp_name, hp_transform in self._transformations.items():
                    hyperparams[hp_name] = hp_transform(hyperparams[hp_name])
            runner = self._runner(self._optimizer_class, self._hyperparam_names)
            output = runner.run(
                testproblem, hyperparams, output_dir=output_dir, **kwargs
            )
            cost = self._determine_cost_from_output_and_mode(output, mode)
            return cost

        return _cost_function

    def _init_bo_space(
        self,
        op,
        cost_function,
        n_init_samples,
        log_path,
        plotting_summary,
        tuning_summary,
    ):
        """Evaluate ``n_init_samples`` random points to seed the GP.

        Args:
            op (bayes_opt.BayesianOptimization): The optimizer object.
            cost_function (callable): Maps hyperparameters to a scalar cost.
            n_init_samples (int): Number of random exploration samples.
            log_path (str): Directory for summary and plotting artifacts.
            plotting_summary (bool): Whether to store the optimizer state
                after each evaluation.
            tuning_summary (bool): Whether to append to the tuning log.
        """
        for iteration in range(1, n_init_samples + 1):
            random_sample = op.space.random_sample()
            # bayes_opt orders the dimensions of a random sample by the
            # sorted hyperparameter names, so the sample values must be
            # paired with the sorted keys. (Zipping with the dict's
            # insertion order and sorting the resulting pairs afterwards
            # would scramble the values whenever the bounds dict is not
            # alphabetically ordered.)
            params = dict(zip(sorted(self._bounds), random_sample))
            target = cost_function(**params)
            if tuning_summary:
                _update_bo_tuning_summary(op._gp, params, target, log_path)
            op.register(params, target)
            # Fit the GP on the newly registered points.
            op._gp.fit(op._space.params, op._space.target)
            if plotting_summary:
                _save_bo_optimizer_object(
                    os.path.join(log_path, "obj"), str(iteration), op
                )

    def tune(
        self,
        testproblem,
        output_dir="./results",
        random_seed=42,
        n_init_samples=5,
        tuning_summary=True,
        plotting_summary=True,
        kernel=None,
        acq_type="ucb",
        acq_kappa=2.576,
        acq_xi=0.0,
        mode="final",
        rerun_best_setting=False,
        **kwargs
    ):
        """Tunes the optimizer hyperparameters by evaluating a Gaussian
        process surrogate with an acquisition function.

        Args:
            testproblem (str): The test problem to tune the optimizer on.
            output_dir (str): The output directory for the results.
            random_seed (int): Random seed for the whole tuning process.
                Every individual run is seeded by it.
            n_init_samples (int): The number of random exploration samples
                in the beginning of the tuning process.
            tuning_summary (bool): Whether to write an additional tuning
                summary. Can be used to get an overview over the tuning
                progress.
            plotting_summary (bool): Whether to store additional objects
                that can be used to plot the posterior.
            kernel (Sklearn.gaussian_process.kernels.Kernel): The kernel of
                the GP.
            acq_type (str): The type of acquisition function to use. Must be
                one of ``ucb``, ``ei``, ``poi``.
            acq_kappa (float): Scaling parameter of the acquisition function.
            acq_xi (float): Scaling parameter of the acquisition function.
            mode (str): The mode that is used to evaluate the cost. Must be
                one of ``final`` or ``best``.
            rerun_best_setting (bool): Whether to automatically rerun the
                best setting with 10 different seeds.

        Raises:
            AssertionError: If ``n_init_samples`` exceeds the available
                ressources.
        """
        self._set_seed(random_seed)
        log_path = os.path.join(output_dir, testproblem, self._optimizer_name)
        cost_function = self._generate_cost_function(
            testproblem, output_dir, mode, **kwargs
        )
        op = bayes_opt.BayesianOptimization(
            f=None, pbounds=self._bounds, random_state=random_seed
        )
        if kernel is not None:
            op._gp.kernel = kernel
        utility_func = UtilityFunction(acq_type, kappa=acq_kappa, xi=acq_xi)

        if tuning_summary:
            _init_summary_directory(log_path, "bo_tuning_log.json")
        if plotting_summary:
            _init_summary_directory(os.path.join(log_path, "obj"))
            _save_bo_optimizer_object(
                os.path.join(log_path, "obj"), "acq_func", utility_func
            )

        # Explicit check instead of try/assert: a bare ``assert`` is
        # stripped under ``python -O`` and the old try/except wrapper was
        # redundant. AssertionError is kept for backward compatibility.
        if n_init_samples > self._ressources:
            raise AssertionError(
                "Number of initial evaluations exceeds the ressources."
            )

        # Evaluates the random exploration points.
        self._init_bo_space(
            op,
            cost_function,
            n_init_samples,
            log_path,
            plotting_summary,
            tuning_summary,
        )

        # Execute remaining ressources with GP-guided suggestions.
        for iteration in range(n_init_samples + 1, self._ressources + 1):
            next_point = op.suggest(utility_func)
            target = cost_function(**next_point)
            if tuning_summary:
                _update_bo_tuning_summary(op._gp, next_point, target, log_path)
            op.register(params=next_point, target=target)
            # Fit the GP on the newly registered points.
            op._gp.fit(op._space.params, op._space.target)
            if plotting_summary:
                _save_bo_optimizer_object(
                    os.path.join(log_path, "obj"), str(iteration), op
                )

        if rerun_best_setting:
            optimizer_path = os.path.join(
                output_dir, testproblem, self._optimizer_name
            )
            rerun_setting(
                self._runner,
                self._optimizer_class,
                self._hyperparam_names,
                optimizer_path,
            )