Epsnet

Implements an epsilon-net based multi-objective sort. Source: github.com/syne-tune/syne-tune/blob/main/syne_tune/optimizer/schedulers/multiobjective/non_dominated_priority.py Proposed in the paper: arxiv.org/pdf/2106.12639

compute_epsilon_net #

compute_epsilon_net(
    X: ndarray, dim: int | None = None
) -> ndarray

Outputs an order of the items in the provided array such that the items are spaced well. This means that after choosing a seed item, the next item is chosen to be the farthest from the seed item. The third item is then chosen to maximize the distance to the existing points and so on.

This algorithm is taken from "Nearest-Neighbor Searching and Metric Space Dimensions" (Clarkson, 2005, p.17).

Parameters#

X: np.ndarray [N, D] The items to sparsify where N is the number of items and D their dimensionality. dim: Optional[int], default: None The index of the dimension which to use to choose the seed item. If None, an item is chosen at random, otherwise the item with the lowest value in the specified dimension is used.

Returns#

np.ndarray [N] A list of item indices, defining a sparsified order of the items.

Source code in neps/optimizers/utils/multiobjective/epsnet.py

def compute_epsilon_net(X: np.ndarray, dim: int | None = None) -> np.ndarray:
    """
    Outputs an order of the items in the provided array such that the items are
    spaced well. This means that after choosing a seed item, the next item is
    chosen to be the farthest from the seed item. The third item is then chosen
    to maximize the distance to the existing points and so on.

    This algorithm is taken from "Nearest-Neighbor Searching and Metric Space Dimensions"
    (Clarkson, 2005, p.17).

    Parameters
    ----------
    X: np.ndarray [N, D]
        The items to sparsify where N is the number of items and D their dimensionality.
    dim: Optional[int], default: None
        The index of the dimension which to use to choose the seed item.
        If ``None``, an item is chosen at random, otherwise the item with the
        lowest value in the specified dimension is used.

    Returns
    -------
    np.ndarray [N]
        A list of item indices, defining a sparsified order of the items.
    """
    indices = set(range(X.shape[0]))

    # Choose the seed item according to dim
    if dim is None:
        initial_index = np.random.choice(X.shape[0])
    else:
        initial_index = np.argmin(X, axis=0)[dim]

    # Initialize the order
    order = [initial_index]
    indices.remove(initial_index)

    # Iterate until all models have been chosen
    while indices:
        # Get the distance to all items that have already been chosen
        ordered_indices = list(indices)
        diff = X[ordered_indices][:, None, :].repeat(len(order), axis=1) - X[order]
        min_distances = np.linalg.norm(diff, axis=-1).min(-1)

        # Then, choose the one with the maximum distance to all points
        choice = ordered_indices[min_distances.argmax()]
        order.append(choice)
        indices.remove(choice)

    # convert argsort indices to rank
    ranks = np.empty(len(order), dtype=int)
    for rank, i in enumerate(order):
        ranks[i] = rank
    return np.array(ranks)

nondominated_sort #

nondominated_sort(
    X: ndarray,
    dim: int | None = None,
    max_items: int | None = None,
    *,
    flatten: bool = True
) -> list[int] | list[list[int]]

Performs a multi-objective sort by iteratively computing the Pareto front and sparsifying the items within the Pareto front. This is a non-dominated sort leveraging an epsilon-net.

Parameters#

X: np.ndarray [N, D] The multi-dimensional items to sort. dim: Optional[int], default: None The feature (metric) to prefer when ranking items within the Pareto front. If None, items are chosen randomly. max_items: Optional[int], default: None The maximum number of items that should be returned. When this is None, all items are sorted. flatten: bool, default: True Whether to flatten the resulting array.

Returns#

Union[List[int], List[List[int]]] The indices of the sorted items, either globally or within each of the Pareto front depending on the value of flatten.

Source code in neps/optimizers/utils/multiobjective/epsnet.py

def nondominated_sort(
    X: np.ndarray,
    dim: int | None = None,
    max_items: int | None = None,
    *,
    flatten: bool = True,
) -> list[int] | list[list[int]]:
    """
    Performs a multi-objective sort by iteratively computing the Pareto front
    and sparsifying the items within the Pareto front. This is a non-dominated sort
    leveraging an epsilon-net.

    Parameters
    ----------
    X: np.ndarray [N, D]
        The multi-dimensional items to sort.
    dim: Optional[int], default: None
        The feature (metric) to prefer when ranking items within the Pareto front.
        If ``None``, items are chosen randomly.
    max_items: Optional[int], default: None
        The maximum number of items that should be returned.
        When this is ``None``, all items are sorted.
    flatten: bool, default: True
        Whether to flatten the resulting array.

    Returns
    -------
    Union[List[int], List[List[int]]]
        The indices of the sorted items, either globally or within each of the
        Pareto front depending on the value of ``flatten``.
    """
    remaining = np.arange(X.shape[0])
    indices = []
    num_items = 0

    # Iterate until max_items are reached or there are no items left
    while remaining.size > 0 and (max_items is None or num_items < max_items):
        # Compute the Pareto front and sort the items within
        pareto_mask = pareto_efficient(X[remaining])
        pareto_front = remaining[pareto_mask]
        pareto_order = compute_epsilon_net(X[pareto_front], dim=dim)

        # Add order to the indices
        indices.append(pareto_front[pareto_order].tolist())
        num_items += len(pareto_front)

        # Remove items in the Pareto front from the remaining items
        remaining = remaining[~pareto_mask]

    # Restrict the number of items returned and optionally flatten
    if max_items is not None:
        limit = max_items - sum(len(x) for x in indices[:-1])
        indices[-1] = indices[-1][:limit]
        if not indices[-1]:
            indices = indices[:-1]

    if flatten:
        return [i for ix in indices for i in ix]
    return indices

pareto_efficient #

pareto_efficient(X: ndarray) -> ndarray

Evaluates for each allocation in the provided array whether it is Pareto efficient. The costs are assumed to be improved by lowering them (eg lower is better).

Parameters#

X: np.ndarray [N, D] The allocations to check where N is the number of allocations and D the number of costs per allocation.

Returns#

np.ndarray [N] A boolean array, indicating for each allocation whether it is Pareto efficient.

Source code in neps/optimizers/utils/multiobjective/epsnet.py

def pareto_efficient(X: np.ndarray) -> np.ndarray:
    """
    Evaluates for each allocation in the provided array whether it is Pareto efficient.
    The costs are assumed to be improved by lowering them (eg lower is better).

    Parameters
    ----------
    X: np.ndarray [N, D]
        The allocations to check where N is the number of allocations and D the number of
        costs per allocation.

    Returns
    -------
    np.ndarray [N]
        A boolean array, indicating for each allocation whether it is Pareto efficient.
    """
    # First, we assume that all allocations are Pareto efficient, i.e. not dominated
    mask = np.ones(X.shape[0], dtype=bool)
    # Then, we iterate over all allocations A and check which are dominated by then
    # current allocation A. If it is, we don't need to check it against another
    # allocation.
    for i, allocation in enumerate(X):
        # Only consider allocation if it hasn't been dominated yet
        if mask[i]:
            # An allocation is dominated by A if all costs are equal or lower
            # and at least one cost is strictly lower. Using that definition,
            # A cannot be dominated by itself.
            dominated = np.all(allocation <= X[mask], axis=1) * np.any(
                allocation < X[mask], axis=1
            )
            mask[mask] = ~dominated

    return mask