Source code for ribs.emitters.opt._evolution_strategy_base

"""Provides EvolutionStrategyBase."""
from abc import ABC, abstractmethod

import numpy as np

# Number of times solutions can be resampled before triggering a warning.
BOUNDS_SAMPLING_THRESHOLD = 100

# Warning for resampling solutions too many times.
BOUNDS_WARNING = (
    "During bounds handling, this ES resampled at least "
    f"{BOUNDS_SAMPLING_THRESHOLD} times. This may indicate that your solution "
    "space bounds are too tight. When bounds are passed in, the ES resamples "
    "until all solutions are within the bounds -- if the bounds are too tight "
    "or the distribution is too large, the ES will resample forever.")


[docs]class EvolutionStrategyBase(ABC): """Base class for evolution strategy optimizers for use with emitters. The basic usage is: - Initialize the optimizer and reset it. - Repeatedly: - Request new solutions with ``ask()`` - Rank the solutions in the emitter (better solutions come first) and pass the indices and values back with ``tell()``. - Use ``check_stop()`` to see if the optimizer has reached a stopping condition, and if so, call ``reset()``. Args: sigma0 (float): Initial step size. solution_dim (int): Size of the solution space. batch_size (int): Number of solutions to evaluate at a time. seed (int): Seed for the random number generator. dtype (str or data-type): Data type of solutions. lower_bounds (float or numpy.ndarray): scalar or (solution_dim,) array indicating lower bounds of the solution space. Scalars specify the same bound for the entire space, while arrays specify a bound for each dimension. Pass -np.inf in the array or scalar to indicated unbounded space. upper_bounds (float or numpy.ndarray): Same as above, but for upper bounds (and pass np.inf instead of -np.inf). """ def __init__(self, sigma0, solution_dim, batch_size=None, seed=None, dtype=np.float64, lower_bounds=-np.inf, upper_bounds=np.inf): pass
[docs] @abstractmethod def reset(self, x0): """Resets the ES to start at x0. Args: x0 (numpy.ndarray): Initial mean. """
[docs] @abstractmethod def check_stop(self, ranking_values): """Checks if the ES should stop and be reset. Args: ranking_values (numpy.ndarray): Array of values that were used to rank the solutions. Shape can be either ``(batch_size,)`` or (batch_size, n_values)``, where ``batch_size`` is the number of solutions and ``n_values`` is the number of values that the ranker used. Note that unlike in :meth:`tell`, these values must be sorted according to the ``ranking_indices`` passed to :meth:`tell`. Returns: True if any of the stopping conditions are satisfied. """
[docs] @abstractmethod def ask(self, batch_size=None): """Samples new solutions. Args: batch_size (int): batch size of the sample. Defaults to ``self.batch_size``. """
[docs] @abstractmethod def tell(self, ranking_indices, ranking_values, num_parents): """Passes the solutions back to the ES. Args: ranking_indices (numpy.ndarray): Integer indices that are used to rank the solutions returned in :meth:`ask`. Note that these are NOT the ranks of the solutions. Rather, they are indices such that ``solutions[ranking_indices]`` will correctly rank the solutions (think of an argsort). ranking_values (numpy.ndarray): Array of values that were used to rank the solutions. Shape can be either ``(batch_size,)`` or (batch_size, n_values)``, where ``batch_size`` is the number of solutions and ``n_values`` is the number of values that the ranker used. Note that we assume a descending sort, i.e., higher values should come first. num_parents (int): Number of top solutions to select from the ranked solutions. """