Source code for ribs.emitters.opt._evolution_strategy_base

"""Provides EvolutionStrategyBase."""
from abc import ABC, abstractmethod

import numpy as np

# Number of times solutions can be resampled before triggering a warning.
BOUNDS_SAMPLING_THRESHOLD = 100

# Warning for resampling solutions too many times.
BOUNDS_WARNING = (
    "During bounds handling, this ES resampled at least "
    f"{BOUNDS_SAMPLING_THRESHOLD} times. This may indicate that your solution "
    "space bounds are too tight. When bounds are passed in, the ES resamples "
    "until all solutions are within the bounds -- if the bounds are too tight "
    "or the distribution is too large, the ES will resample forever.")


[docs]class EvolutionStrategyBase(ABC):
    """Base class for evolution strategy optimizers for use with emitters.

    The basic usage is:

    - Initialize the optimizer and reset it.
    - Repeatedly:

        - Request new solutions with ``ask()``
        - Rank the solutions in the emitter (better solutions come first) and
          pass the indices and values back with ``tell()``.
        - Use ``check_stop()`` to see if the optimizer has reached a stopping
          condition, and if so, call ``reset()``.

    Args:
        sigma0 (float): Initial step size.
        solution_dim (int): Size of the solution space.
        batch_size (int): Number of solutions to evaluate at a time.
        seed (int): Seed for the random number generator.
        dtype (str or data-type): Data type of solutions.
        lower_bounds (float or numpy.ndarray): scalar or (solution_dim,) array
            indicating lower bounds of the solution space. Scalars specify
            the same bound for the entire space, while arrays specify a
            bound for each dimension. Pass -np.inf in the array or scalar to
            indicated unbounded space.
        upper_bounds (float or numpy.ndarray): Same as above, but for upper
            bounds (and pass np.inf instead of -np.inf).
    """

    def __init__(self,
                 sigma0,
                 solution_dim,
                 batch_size=None,
                 seed=None,
                 dtype=np.float64,
                 lower_bounds=-np.inf,
                 upper_bounds=np.inf):
        pass

[docs]    @abstractmethod
    def reset(self, x0):
        """Resets the ES to start at x0.

        Args:
            x0 (numpy.ndarray): Initial mean.
        """

[docs]    @abstractmethod
    def check_stop(self, ranking_values):
        """Checks if the ES should stop and be reset.

        Args:
            ranking_values (numpy.ndarray): Array of values that were used to
                rank the solutions. Shape can be either ``(batch_size,)`` or
                (batch_size, n_values)``, where ``batch_size`` is the number of
                solutions and ``n_values`` is the number of values that the
                ranker used. Note that unlike in :meth:`tell`, these values must
                be sorted according to the ``ranking_indices`` passed to
                :meth:`tell`.
        Returns:
            True if any of the stopping conditions are satisfied.
        """

[docs]    @abstractmethod
    def ask(self, batch_size=None):
        """Samples new solutions.

        Args:
            batch_size (int): batch size of the sample. Defaults to
                ``self.batch_size``.
        """

[docs]    @abstractmethod
    def tell(self, ranking_indices, ranking_values, num_parents):
        """Passes the solutions back to the ES.

        Args:
            ranking_indices (numpy.ndarray): Integer indices that are used to
                rank the solutions returned in :meth:`ask`. Note that these are
                NOT the ranks of the solutions. Rather, they are indices such
                that ``solutions[ranking_indices]`` will correctly rank the
                solutions (think of an argsort).
            ranking_values (numpy.ndarray): Array of values that were used to
                rank the solutions. Shape can be either ``(batch_size,)`` or
                (batch_size, n_values)``, where ``batch_size`` is the number of
                solutions and ``n_values`` is the number of values that the
                ranker used. Note that we assume a descending sort, i.e., higher
                values should come first.
            num_parents (int): Number of top solutions to select from the
                ranked solutions.
        """