Source code for shapiq.utils.sets

"""This module contains utility functions for dealing with sets, coalitions and game theory."""

from __future__ import annotations

import copy
import math
from itertools import chain, combinations
from typing import TYPE_CHECKING, TypeVar

import numpy as np
from scipy.special import binom, gammaln

if TYPE_CHECKING:
    from collections.abc import Collection, Iterable, Iterator

    from shapiq.typing import CoalitionMatrix, CoalitionTuple

# Names exported by a star-import of this module.
# NOTE(review): ``generate_interaction_lookup_from_coalitions`` is defined in this module but is
# not listed here -- confirm whether that omission is intentional.
__all__ = [
    "count_interactions",
    "generate_interaction_lookup",
    "get_explicit_subsets",
    "log_binom",
    "pair_subset_sizes",
    "powerset",
    "split_subsets_budget",
    "transform_array_to_coalitions",
    "transform_coalitions_to_array",
]

# Type variable for player identifiers, constrained to ``int`` or ``str``; used in the
# signatures of ``powerset`` and ``generate_interaction_lookup``.
T = TypeVar("T", int, str)



[docs]
def log_binom(n: int, k: int | np.ndarray) -> float | np.ndarray:
    """Return ``log(binom(n, k))``, evaluated entirely in log-space.

    The value is obtained from :func:`scipy.special.gammaln` through the identity
    ``gammaln(n + 1) - gammaln(k + 1) - gammaln(n - k + 1)``, so it remains finite for large ``n``
    where :func:`scipy.special.binom` would overflow to ``inf``. Working in log-space allows
    weights and sampling probabilities built from very large binomial coefficients to be combined
    without intermediate overflow or underflow.

    Args:
        n: The number of elements (a non-negative integer).
        k: The number of chosen elements, given as a scalar or as a numpy array. Any entry
            outside ``[0, n]`` maps to ``-inf`` (i.e. ``binom(n, k) == 0``).

    Returns:
        ``log(binom(n, k))``: a plain float when ``k`` is a scalar, otherwise a numpy array.

    """
    k_values = np.asarray(k, dtype=np.float64)
    # Out-of-range entries can produce ``inf - inf``; silence the warning, they are masked below.
    with np.errstate(invalid="ignore"):
        log_coefficient = gammaln(n + 1) - gammaln(k_values + 1) - gammaln(n - k_values + 1)
    in_range = (k_values >= 0) & (k_values <= n)
    log_coefficient = np.where(in_range, log_coefficient, -np.inf)
    # Scalar in -> Python float out; array in -> array out.
    return float(log_coefficient) if np.ndim(k) == 0 else log_coefficient




[docs]
def powerset(
    iterable: Iterable[T],
    min_size: int = 0,
    max_size: int | None = None,
) -> Iterator[tuple[T, ...]]:
    """Iterate over all subsets of an iterable, optionally restricted to a range of sizes.

    The elements are sorted first; subsets are then produced as tuples, grouped by increasing
    size.

    Args:
        iterable: The elements (e.g., a list or a set) to build subsets from.
        min_size: Smallest subset size to produce. Defaults to 0 (start with the empty set).
            Negative values are treated as 0.
        max_size: Largest subset size to produce. Defaults to None (up to all elements). Values
            larger than the number of elements are capped at that number.

    Returns:
        An iterator over the subsets as tuples.

    Example:
        >>> list(powerset([1, 2, 3]))
        [(), (1,), (2,), (3,), (1, 2), (1, 3), (2, 3), (1, 2, 3)]

        >>> list(powerset([1, 2, 3], min_size=1))
        [(1,), (2,), (3,), (1, 2), (1, 3), (2, 3), (1, 2, 3)]

        >>> list(powerset([1, 2, 3], max_size=2))
        [(), (1,), (2,), (3,), (1, 2), (1, 3), (2, 3)]

        >>> list(powerset(["A", "B", "C"], min_size=1, max_size=2))
        [('A',), ('B',), ('C',), ('A', 'B'), ('A', 'C'), ('B', 'C')]

    """
    elements = sorted(iterable)
    n_elements = len(elements)
    largest = n_elements if max_size is None else min(max_size, n_elements)
    smallest = max(min_size, 0)
    sizes = range(smallest, largest + 1)
    return chain.from_iterable(combinations(elements, size) for size in sizes)




[docs]
def pair_subset_sizes(order: int, n: int) -> tuple[list[tuple[int, int]], int | None]:
    """Pair up subset sizes from the outside in.

    The candidate sizes are ``order, ..., n - order``. The smallest size is matched with the
    largest, the second smallest with the second largest, and so on towards the center. When the
    number of candidate sizes is odd, the middle size has no partner.

    Args:
        order: interaction order.
        n: number of players.

    Returns:
        The list of paired sizes and the unpaired (middle) size, which is None if every size has
        a partner.

    Examples:
        >>> pair_subset_sizes(order=1, n=5)
        ([(1, 4), (2, 3)], None)

        >>> pair_subset_sizes(order=1, n=6)
        ([(1, 5), (2, 4)], 3)

        >>> pair_subset_sizes(order=2, n=5)
        ([(2, 3)], None)

    """
    sizes = list(range(order, n - order + 1))
    n_pairs, has_middle = divmod(len(sizes), 2)
    # zip stops after ``n_pairs`` items, matching the i-th smallest with the i-th largest size
    pairs = list(zip(sizes[:n_pairs], reversed(sizes)))
    middle = sizes[n_pairs] if has_middle else None
    return pairs, middle




[docs]
def split_subsets_budget(
    order: int,
    n: int,
    budget: int,
    sampling_weights: np.ndarray,
) -> tuple[list, list, int]:
    """Determines which subset sizes can be computed explicitly and which sizes need to be sampled.

    Given a computational budget, determines the complete subsets that can be computed explicitly
    and the corresponding incomplete subsets that need to be estimated via sampling. Paired subset
    sizes (see ``pair_subset_sizes``) are processed from the outermost pair inwards; the first pair
    that does not fit into its share of the budget stops the procedure.

    Args:
        order: interaction order.
        n: number of players.
        budget: total allowed budget for the computation.
        sampling_weights: weight vector of the sampling distribution in shape (n + 1,). The first
            and last element constituting the empty and full subsets are not used. The input is
            never modified; integer arrays and plain sequences are accepted and converted to a
            floating point working copy.

    Returns:
        complete subsets, incomplete subsets, remaining budget

    Examples:
        >>> split_subsets_budget(order=1, n=6, budget=100, sampling_weights=np.ones(shape=(7,)))
        ([1, 5, 2, 4, 3], [], 38)

        >>> split_subsets_budget(order=1, n=6, budget=60, sampling_weights=np.ones(shape=(7,)))
        ([1, 5, 2, 4], [3], 18)

        >>> split_subsets_budget(order=1, n=6, budget=100, sampling_weights=np.zeros(shape=(7,)))
        ([], [1, 2, 3, 4, 5], 100)

    """
    # determine paired and unpaired subsets
    complete_subsets: list[int] = []
    paired_subsets, unpaired_subset = pair_subset_sizes(order, n)
    incomplete_subsets = list(range(order, n - order + 1))

    # Work on a private floating point copy: the normalizations below divide in place, which
    # fails for integer arrays and for plain sequences.
    weight_vector = np.asarray(sampling_weights)
    if np.issubdtype(weight_vector.dtype, np.floating):
        weight_vector = copy.copy(weight_vector)  # keep the dtype, never mutate the input
    else:
        weight_vector = weight_vector.astype(np.float64)  # ``astype`` already returns a copy

    # turn weight vector into probability vector
    weight_vector[0], weight_vector[-1] = 0, 0  # zero out the empty and full subsets
    sum_weight_vector = np.sum(weight_vector)
    weight_vector = np.divide(
        weight_vector,
        sum_weight_vector,
        out=weight_vector,
        where=sum_weight_vector != 0,  # an all-zero vector is left untouched
    )

    # check if the budget is sufficient to compute all paired subset sizes explicitly
    allowed_budget = weight_vector * budget  # allowed budget for each subset size
    for subset_size_1, subset_size_2 in paired_subsets:
        subset_budget = int(binom(n, subset_size_1))  # required budget for full computation
        # check if the budget is sufficient to compute the paired subset sizes explicitly
        if allowed_budget[subset_size_1] >= subset_budget and allowed_budget[subset_size_1] > 0:
            complete_subsets.extend((subset_size_1, subset_size_2))
            incomplete_subsets.remove(subset_size_1)
            incomplete_subsets.remove(subset_size_2)
            weight_vector[subset_size_1], weight_vector[subset_size_2] = 0, 0  # zero used sizes
            remaining_weight = np.sum(weight_vector)
            if remaining_weight != 0:
                weight_vector /= remaining_weight  # re-normalize into probability vector
            budget -= subset_budget * 2  # both sizes of a pair contain the same number of subsets
        else:  # if the budget is not sufficient, return the current state
            return complete_subsets, incomplete_subsets, budget
        allowed_budget = weight_vector * budget  # update allowed budget for each subset size

    # check if the budget is sufficient to compute the unpaired subset size explicitly
    if unpaired_subset is not None:
        subset_budget = int(binom(n, unpaired_subset))
        if budget - subset_budget >= 0:
            complete_subsets.append(unpaired_subset)
            incomplete_subsets.remove(unpaired_subset)
            budget -= subset_budget
    return complete_subsets, incomplete_subsets, budget




[docs]
def get_explicit_subsets(n: int, subset_sizes: list[int]) -> np.ndarray:
    """Build the one-hot matrix of every subset that has one of the requested sizes.

    Rows are ordered by the position of their size in ``subset_sizes`` and, within one size, in
    the order produced by :func:`itertools.combinations` over ``range(n)``.

    Args:
        n: number of players.
        subset_sizes: list of subset sizes.

    Returns:
        Boolean matrix with one row per subset and one column per player.

    Examples:
        >>> get_explicit_subsets(n=4, subset_sizes=[1, 2]).astype(int)
        array([[1, 0, 0, 0],
               [0, 1, 0, 0],
               [0, 0, 1, 0],
               [0, 0, 0, 1],
               [1, 1, 0, 0],
               [1, 0, 1, 0],
               [1, 0, 0, 1],
               [0, 1, 1, 0],
               [0, 1, 0, 1],
               [0, 0, 1, 1]])

    """
    n_rows = int(sum(binom(n, size) for size in subset_sizes))
    one_hot = np.zeros(shape=(n_rows, n), dtype=bool)
    # stream the subsets of all requested sizes one after another
    all_subsets = chain.from_iterable(combinations(range(n), size) for size in subset_sizes)
    for row, members in enumerate(all_subsets):
        one_hot[row, members] = True
    return one_hot




[docs]
def generate_interaction_lookup(
    players: Iterable[T] | int,
    min_order: int,
    max_order: int | None = None,
) -> dict[tuple[T, ...], int] | dict[tuple[int, ...], int]:
    """Map every interaction between ``min_order`` and ``max_order`` to a running index.

    The interactions are enumerated with ``powerset`` and numbered in the order in which it
    yields them.

    Args:
        players: A unique set of players or an Integer denoting the number of players. An integer
            ``p`` stands for the players ``0, ..., p - 1``.
        min_order: The minimum order of the approximation.
        max_order: The maximum order of the approximation.

    Returns:
        A dictionary that maps interactions to their index in the values vector.

    Example:
        >>> generate_interaction_lookup(3, 1, 3)
        {(0,): 0, (1,): 1, (2,): 2, (0, 1): 3, (0, 2): 4, (1, 2): 5, (0, 1, 2): 6}
        >>> generate_interaction_lookup(3, 2, 2)
        {(0, 1): 0, (0, 2): 1, (1, 2): 2}
        >>> generate_interaction_lookup(["A", "B", "C"], 1, 2)
        {('A',): 0, ('B',): 1, ('C',): 2, ('A', 'B'): 3, ('A', 'C'): 4, ('B', 'C'): 5}

    """
    # an integer is shorthand for the players 0, ..., players - 1
    player_pool = range(players) if isinstance(players, int) else players
    interactions = powerset(player_pool, min_size=min_order, max_size=max_order)
    return {interaction: position for position, interaction in enumerate(interactions)}




[docs]
def generate_interaction_lookup_from_coalitions(
    coalitions: CoalitionMatrix,
) -> dict[tuple[int, ...], int]:
    """Generates a lookup dictionary for interactions based on an array of coalitions.

    Every row of ``coalitions`` is turned into the tuple of its non-zero column indices, which is
    then mapped to the row's position. The player indices in the keys are built-in ``int``
    objects (not numpy scalars), so the keys match the annotated ``tuple[int, ...]`` type and
    print cleanly. If the same coalition occurs in several rows, the last row index wins.

    Args:
        coalitions: An array of player coalitions.

    Returns:
        A dictionary that maps interactions to their index in the values vector

    Example:
        >>> coalitions = np.array([
        ...     [1, 0, 1],
        ...     [0, 1, 1],
        ...     [1, 1, 0],
        ...     [0, 0, 1]
        ... ])
        >>> generate_interaction_lookup_from_coalitions(coalitions)
        {(0, 2): 0, (1, 2): 1, (0, 1): 2, (2,): 3}

    """
    return {
        # ``tolist`` converts the numpy integer indices into plain Python ints
        tuple(np.where(coalition)[0].tolist()): idx
        for idx, coalition in enumerate(coalitions)
    }




[docs]
def transform_coalitions_to_array(
    coalitions: Collection[CoalitionTuple],
    n_players: int | None = None,
) -> CoalitionMatrix:
    """Transforms a collection of coalitions to a binary array (one-hot encodings).

    Args:
        coalitions: Collection of coalitions.
        n_players: Number of players. Defaults to None (determined from the coalitions as the
            largest player index plus one; empty coalitions are ignored for this, and if no
            coalition contains a player the result has zero columns). If provided, n_players must
            be greater than the maximum player index in the coalitions.

    Returns:
        Binary array of coalitions.

    Example:
        >>> coalitions = [(0, 1), (1, 2), (0, 2)]
        >>> transform_coalitions_to_array(coalitions)
        array([[ True,  True, False],
               [False,  True,  True],
               [ True, False,  True]])

        >>> transform_coalitions_to_array(coalitions, n_players=4)
        array([[ True,  True, False, False],
               [False,  True,  True, False],
               [ True, False,  True, False]])

        >>> transform_coalitions_to_array([(), (0, 2)])
        array([[False, False, False],
               [ True, False,  True]])

    """
    n_coalitions = len(coalitions)
    if n_players is None:
        # Empty coalitions carry no player index; skipping them (and falling back to -1 when
        # nothing is left) keeps ``max`` from being called on an empty sequence.
        highest_player = max(
            (max(coalition) for coalition in coalitions if len(coalition) > 0),
            default=-1,
        )
        n_players = highest_player + 1

    coalition_array = np.zeros((n_coalitions, n_players), dtype=bool)
    for i, coalition in enumerate(coalitions):
        coalition_array[i, coalition] = True  # set all columns of the coalition's players at once
    return coalition_array




[docs]
def transform_array_to_coalitions(coalitions: CoalitionMatrix) -> Collection[CoalitionTuple]:
    """Transforms a 2d one-hot matrix of coalitions into a list of tuples.

    Each row becomes the tuple of its non-zero column indices. The indices are returned as
    built-in ``int`` objects (not numpy scalars), so the tuples print as shown in the examples
    and can be serialized without further conversion.

    Args:
        coalitions: A binary array of coalitions.

    Returns:
        List of coalitions as tuples.

    Examples:
        >>> coalitions = np.array([[True, True, False], [False, True, True], [True, False, True]])
        >>> transform_array_to_coalitions(coalitions)
        [(0, 1), (1, 2), (0, 2)]

        >>> coalitions = np.array([[False, False, False], [True, True, True]])
        >>> transform_array_to_coalitions(coalitions)
        [(), (0, 1, 2)]

    """
    # ``tolist`` converts the numpy integer indices into plain Python ints
    return [tuple(np.where(coalition)[0].tolist()) for coalition in coalitions]




[docs]
def count_interactions(n: int, max_order: int | None = None, min_order: int = 0) -> int:
    """Counts the number of interactions for a given number of players and maximum order.

    The count is the sum of the binomial coefficients ``binom(n, size)`` over all sizes from
    ``min_order`` to ``max_order``. It is computed with exact integer arithmetic, so the result
    is correct for any number of players (no floating point rounding or overflow).

    Args:
        n: Number of players.
        max_order: Maximum order of the interactions. If `None`, it is set to the number of players.
            Defaults to `None`. Orders above ``n`` contribute no interactions.
        min_order: Minimum order of the interactions. Defaults to 0. Negative orders contribute
            no interactions.

    Returns:
        The number of interactions.

    Examples:
        >>> count_interactions(3)
        8
        >>> count_interactions(3, 2)
        7
        >>> count_interactions(3, 2, 1)
        6

    """
    # Sizes outside [0, n] have a binomial coefficient of zero; clamping the bounds drops them
    # and keeps every argument of ``math.comb`` valid.
    upper = n if max_order is None else min(max_order, n)
    lower = max(min_order, 0)
    return sum(math.comb(n, size) for size in range(lower, upper + 1))