# Source code for shapiq.game_theory.moebius_converter

"""MoebiusConverter class for computing exact Shapley Interactions from Möbius coefficients."""

from __future__ import annotations

import copy
from typing import Any, Literal, get_args

import numpy as np
from scipy.special import binom

from shapiq.interaction_values import InteractionValues
from shapiq.utils.sets import powerset

ValidMoebiusConverterIndices = Literal["k-SII", "STII", "FSII", "FBII", "SII", "SV", "BV"]



[docs]
class MoebiusConverter:
    """Computes a variety of game-theoretic concepts exactly from Möbius coefficients.

    The MoebiusConverter class is used to compute various game-theoretic concepts like Shapley
    values, Shapley interactions, Banzhaf interactions, and many more from a collection of Möbius
    coefficients (also called Möbius Interactions, MI) of a game. The MoebiusConverter is built
    with the idea that some games have a sparse Möbius representation, i.e. only few of their
    Möbius coefficients are non-zero.

    It computes exact Shapley interactions (and the other supported indices) using the (sparse)
    Möbius representation. This is much faster than exact computation if the Möbius
    representation is sparse.

    Attributes:
        n: The number of players.
        moebius_coefficients: The InteractionValues object containing all non-zero (sparse) Möbius
            coefficients.

    """

    # All index names accepted by ``__call__``; derived from the Literal alias so the two cannot
    # drift apart. Annotated as a variable-length tuple: ``tuple[X]`` would describe a tuple of
    # exactly one element, but the alias has several members.
    valid_indices: tuple[ValidMoebiusConverterIndices, ...] = tuple(
        get_args(ValidMoebiusConverterIndices)
    )

    def __init__(self, moebius_coefficients: InteractionValues) -> None:
        """Create a converter around a collection of Möbius coefficients.

        Args:
            moebius_coefficients: InteractionValues object holding the (potentially sparse)
                Möbius coefficients. Its ``n_players`` attribute is stored as ``self.n``.
        """
        self.moebius_coefficients: InteractionValues = moebius_coefficients
        self.n = moebius_coefficients.n_players
        # cache of already converted results, keyed by ``(index, order)``
        self._computed: dict[tuple[ValidMoebiusConverterIndices, int], InteractionValues] = {}


[docs]
    def __call__(
        self, index: ValidMoebiusConverterIndices, order: int | None = None
    ) -> InteractionValues:
        """Return the requested index, computing it on first use and caching the result.

        Args:
            index: Name of the index or value to compute; must be one of ``valid_indices``
                unless a result for it is already cached.
            order: The order of the interaction index. ``None`` (the default) selects the
                maximum order, i.e. the number of players ``self.n``.

        Returns:
            A deep copy of the cached interaction values, so the cached object is never handed
            out directly.

        Raises:
            ValueError: If the index is not cached and not contained in ``valid_indices``.

        """
        resolved_order = self.n if order is None else order
        cache_key = (index, resolved_order)

        # Cache miss: validate the index first, then compute and remember the result.
        if cache_key not in self._computed:
            if index not in self.valid_indices:
                msg = f"Index {index} not supported."
                raise ValueError(msg)
            self._computed[cache_key] = self.compute(index=index, order=resolved_order)

        return copy.deepcopy(self._computed[cache_key])


    @staticmethod
    def _base_aggregation(base_interactions: InteractionValues, order: int) -> InteractionValues:
        """Aggregate base interactions into interactions satisfying efficiency (e.g. SII to k-SII).

        The work is delegated to ``aggregate_base_interaction`` from the sibling ``aggregation``
        module; this wrapper only returns a shallow copy of its result.

        Args:
            base_interactions: InteractionValues object containing interactions up to order
                ``order``.
            order: The highest order of interactions considered.

        Returns:
            A shallow copy of the aggregated InteractionValues object.

        """
        # imported inside the function rather than at module level
        from .aggregation import aggregate_base_interaction

        return copy.copy(aggregate_base_interaction(base_interactions, order))


[docs]
    def compute(self, index: ValidMoebiusConverterIndices, order: int) -> InteractionValues:
        """Dispatch to the routine that computes ``index`` from the Möbius coefficients.

        ``"SV"`` and ``"BV"`` are always computed with order 1; the ``order`` argument is ignored
        for them.

        Args:
            index: The index or value to compute.
            order: The order of the interaction index.

        Returns:
            The desired interaction values or generalized values.

        Raises:
            ValueError: If ``index`` is none of the handled index names.

        """
        # Values (order fixed to 1)
        if index == "SV":
            return self._moebius_to_base_interaction(index="SV", order=1)
        if index == "BV":
            # NOTE(review): computed by the FBII routine, which is passed index="FBII" here;
            # confirm whether the returned object is meant to carry the "FBII" label.
            return self._fii_routine(index="FBII", order=1)

        # Interaction indices of the requested order
        if index == "k-SII":
            return self._moebius_to_k_sii(order=order)
        if index == "STII":
            return self._stii_routine(order=order)
        if index == "SII":
            return self._moebius_to_base_interaction(index="SII", order=order)
        if index == "FBII":
            return self._fii_routine(index="FBII", order=order)
        if index == "FSII":
            return self._fii_routine(index="FSII", order=order)

        msg = (
            f"Invalid index. Index `{index}` is not supported. "
            f"Supported indices are: {self.valid_indices}."
        )
        raise ValueError(msg)


    def _moebius_to_base_interaction(
        self, index: Literal["SII", "SV"], order: int
    ) -> InteractionValues:
        """Compute a base interaction index (SII) or the Shapley values (SV).

        Every Möbius coefficient is distributed onto the interactions of size ``1..order`` that
        are contained in its coalition, using the SII distribution weights. ``"SV"`` uses the
        same weights and only differs in the ``index`` label of the returned object.

        Args:
            index: The base interaction index to compute, either ``"SII"`` or ``"SV"``.
            order: The order of the explanation, i.e. the maximum interaction size.

        Returns:
            An InteractionValues object containing the non-zero base interactions.

        """
        # SV is computed with the SII weights; the original label is kept for the result.
        weight_index = "SII" if index == "SV" else index

        # distribution_weights[m, s]: share of a size-m Möbius coefficient that each contained
        # interaction of size s receives. Row 0 and column 0 are never filled and stay zero.
        distribution_weights = np.zeros((self.n + 1, order + 1))
        for moebius_size in range(1, self.n + 1):
            for interaction_size in range(1, min(order, moebius_size) + 1):
                distribution_weights[moebius_size, interaction_size] = (
                    _get_moebius_distribution_weight(
                        moebius_size, interaction_size, order, weight_index
                    )
                )

        base_interaction_dict: dict[tuple, float] = {}
        moebius_values = self.moebius_coefficients.values
        # Look each value up through its stored position instead of zipping the lookup keys with
        # the value array: the zip silently relies on the dict's insertion order matching the
        # positions and truncates without error when the lengths differ.
        for moebius_set, position in self.moebius_coefficients.interaction_lookup.items():
            moebius_val = moebius_values[position]
            moebius_size = len(moebius_set)
            # The empty interaction always has weight zero (column 0), so start at size 1.
            for interaction in powerset(moebius_set, min_size=1, max_size=order):
                moebius_val_calc = moebius_val * distribution_weights[moebius_size, len(interaction)]
                # Nothing of this Möbius value is distributed onto this interaction
                if moebius_val_calc == 0:
                    continue
                updated = base_interaction_dict.get(interaction, 0) + moebius_val_calc
                if updated == 0:
                    # contributions cancelled out exactly: keep the result sparse
                    base_interaction_dict.pop(interaction, None)
                else:
                    base_interaction_dict[interaction] = updated

        # Convert the sparse dict into the value array plus interaction -> position lookup.
        base_interaction_lookup = {
            interaction: i for i, interaction in enumerate(base_interaction_dict)
        }
        base_interaction_values = np.array(list(base_interaction_dict.values()), dtype=float)

        return InteractionValues(
            values=base_interaction_values,
            interaction_lookup=base_interaction_lookup,
            index=index,
            min_order=1,
            max_order=order,
            n_players=self.n,
            baseline_value=self.moebius_coefficients[()],
            estimation_budget=self.moebius_coefficients.estimation_budget,
            estimated=self.moebius_coefficients.estimated,
        )

    def _stii_routine(
        self,
        order: int,
        **kwargs: Any,  # noqa: ARG002
    ) -> InteractionValues:
        """Compute STII by distributing the Möbius coefficients onto the STII interactions.

        Interactions below the top order are equal to their Möbius coefficients, whereas the
        top-order interactions (``size == order``) additionally collect the distributed
        coefficients of all larger Möbius sets that contain them.

        Args:
            order: The order of the explanation.
            **kwargs: Additional keyword arguments are not used.

        Returns:
            An InteractionValues object containing the STII interactions.

        """
        # distribution_weights[m, s]: share of a size-m Möbius coefficient that each contained
        # interaction of size s receives. Row 0 and column 0 are never filled and stay zero.
        distribution_weights = np.zeros((self.n + 1, order + 1))
        for moebius_size in range(1, self.n + 1):
            for interaction_size in range(1, min(order, moebius_size) + 1):
                distribution_weights[moebius_size, interaction_size] = (
                    _get_moebius_distribution_weight(moebius_size, interaction_size, order, "STII")
                )

        # The empty set always carries the baseline (empty-set Möbius coefficient).
        stii_dict = {(): self.moebius_coefficients[()]}

        moebius_values = self.moebius_coefficients.values
        # Look each value up through its stored position instead of zipping the lookup keys with
        # the value array: the zip silently relies on the dict's insertion order matching the
        # positions and truncates without error when the lengths differ.
        for moebius_set, position in self.moebius_coefficients.interaction_lookup.items():
            moebius_val = moebius_values[position]
            moebius_size = len(moebius_set)
            if moebius_size < order:
                # below the top order the Möbius set only contributes to itself
                targets = (moebius_set,)
            else:
                # Möbius sets of size >= order distribute to all contained top-order interactions
                targets = powerset(moebius_set, min_size=order, max_size=order)

            for interaction in targets:
                moebius_val_calc = moebius_val * distribution_weights[moebius_size, len(interaction)]
                # Nothing of this Möbius value is distributed onto this interaction
                if moebius_val_calc == 0:
                    continue
                updated = stii_dict.get(interaction, 0) + moebius_val_calc
                if updated == 0:
                    # contributions cancelled out exactly: keep the result sparse
                    stii_dict.pop(interaction, None)
                else:
                    stii_dict[interaction] = updated

        # Convert the sparse dict into the value array plus interaction -> position lookup.
        stii_lookup = {interaction: i for i, interaction in enumerate(stii_dict)}
        stii_values = np.array(list(stii_dict.values()), dtype=float)

        return InteractionValues(
            values=stii_values,
            interaction_lookup=stii_lookup,
            index="STII",
            min_order=0,
            max_order=order,
            n_players=self.n,
            baseline_value=self.moebius_coefficients[()],
        )

    def _fii_routine(self, index: Literal["FSII", "FBII"], order: int) -> InteractionValues:
        """Compute FSII or FBII by distributing the Möbius coefficients onto the interactions.

        Möbius sets with ``size <= order`` contribute to their own interaction, while
        higher-order Möbius sets (``size > order``) are distributed onto all contained
        interactions of size ``1..order``. For FBII, the empty-set value additionally receives a
        correction term from every Möbius set with ``size > order``.

        Args:
            index: The interaction index, either ``"FSII"`` or ``"FBII"``.
            order: The order of the explanation.

        Returns:
            An InteractionValues object containing the FSII or FBII interactions. Its
            ``baseline_value`` is the (possibly corrected) empty-set value.

        """
        # distribution_weights[m, s]: share of a size-m Möbius coefficient that each contained
        # interaction of size s receives. Only sizes >= 1 are filled: the distribution loop below
        # requests interactions of size >= 1 only, so row 0 and column 0 are never read. Skipping
        # them also avoids a division by zero in the FSII weight when ``order`` is 0.
        distribution_weights = np.zeros((self.n + 1, order + 1))
        for moebius_size in range(1, self.n + 1):
            for interaction_size in range(1, min(order, moebius_size) + 1):
                distribution_weights[moebius_size, interaction_size] = (
                    _get_moebius_distribution_weight(moebius_size, interaction_size, order, index)
                )

        # Both indices start from the empty-set Möbius coefficient as empty-set value.
        fii_dict = {(): self.moebius_coefficients[()]}

        moebius_values = self.moebius_coefficients.values
        # Look each value up through its stored position instead of zipping the lookup keys with
        # the value array: the zip silently relies on the dict's insertion order matching the
        # positions and truncates without error when the lengths differ.
        for moebius_set, position in self.moebius_coefficients.interaction_lookup.items():
            moebius_val = moebius_values[position]
            moebius_size = len(moebius_set)

            # FBII only: higher-order Möbius sets also contribute to the empty-set value
            if index == "FBII" and moebius_size > order:
                fii_dict[()] += (-1) ** (order) * (
                    (1 / 2) ** moebius_size * binom(moebius_size - 1, order) * moebius_val
                )

            # Distribute the Möbius value among all contained interactions up to ``order``
            for interaction in powerset(moebius_set, min_size=1, max_size=order):
                moebius_val_calc = moebius_val * distribution_weights[moebius_size, len(interaction)]
                # Nothing of this Möbius value is distributed onto this interaction
                if moebius_val_calc == 0:
                    continue
                updated = fii_dict.get(interaction, 0) + moebius_val_calc
                if updated == 0:
                    # contributions cancelled out exactly: keep the result sparse
                    fii_dict.pop(interaction, None)
                else:
                    fii_dict[interaction] = updated

        # Convert the sparse dict into the value array plus interaction -> position lookup.
        fii_lookup = {interaction: i for i, interaction in enumerate(fii_dict)}
        fii_values = np.array(list(fii_dict.values()), dtype=float)

        return InteractionValues(
            values=fii_values,
            interaction_lookup=fii_lookup,
            index=index,
            min_order=0,
            max_order=order,
            n_players=self.n,
            baseline_value=fii_dict[()],
        )

    def _moebius_to_k_sii(
        self,
        order: int,
    ) -> InteractionValues:
        """Compute the k-Shapley Interaction Index (k-SII) from the Möbius coefficients.

        SII is computed first and then aggregated to k-SII. Both intermediate and final result
        are written to the internal cache under ``("SII", order)`` and ``("k-SII", order)``.

        Args:
            order: The order of the explanation.

        Returns:
            A shallow copy of the InteractionValues object containing the k-SII interactions.

        """
        # Step 1: base interactions; cached before aggregating so they survive on their own
        base_values = self._moebius_to_base_interaction(index="SII", order=order)
        self._computed["SII", order] = base_values

        # Step 2: aggregate SII into k-SII and cache the aggregated object
        aggregated = self._base_aggregation(base_values, order)
        self._computed["k-SII", order] = aggregated

        return copy.copy(aggregated)



def _get_moebius_distribution_weight(
    moebius_size: int,
    interaction_size: int,
    order: int,
    index: Literal["SII", "STII", "FSII", "FBII"],
) -> float:
    """Return the distribution weights for the Möbius coefficients onto the lower-order interaction indices.

    Args:
        moebius_size: The size of the Möbius coefficient.
        interaction_size: The size of the interaction.
        order: The order of the explanation.
        index: The interaction index.

    Returns:
        A distribution weight for the given combination.

    Raises:
        ValueError: If the index is not supported.

    """
    if index == "SII":
        return _sii_distribution_weight(moebius_size, interaction_size)
    if index == "STII":
        return _stii_distribution_weight(moebius_size, interaction_size, order)
    if index == "FSII":
        return _fsii_distribution_weight(moebius_size, interaction_size, order)
    if index == "FBII":
        return _fbii_distribution_weight(moebius_size, interaction_size, order)
    msg = f"Index {index} not supported."
    raise ValueError(msg)


def _sii_distribution_weight(moebius_size: int, interaction_size: int) -> float:
    """Return the distribution weight for SII."""
    return 1 / (moebius_size - interaction_size + 1)


def _stii_distribution_weight(moebius_size: int, interaction_size: int, order: int) -> float:
    """Return the distribution weight for STII."""
    if moebius_size <= order:
        if moebius_size == interaction_size:
            return 1
        return 0
    if interaction_size == order:
        return 1 / binom(moebius_size, moebius_size - interaction_size)
    return 0


def _fsii_distribution_weight(moebius_size: int, interaction_size: int, order: int) -> float:
    """Return the distribution weight for FSII."""
    if moebius_size <= order:
        if moebius_size == interaction_size:
            return 1
        return 0
    return (
        (-1) ** (order - interaction_size)
        * (interaction_size / (order + interaction_size))
        * (
            binom(order, interaction_size)
            * binom(moebius_size - 1, order)
            / binom(moebius_size + order - 1, order + interaction_size)
        )
    )


def _fbii_distribution_weight(moebius_size: int, interaction_size: int, order: int) -> float:
    """Return the distribution weight for FBII."""
    if moebius_size <= order:
        if moebius_size == interaction_size:
            return 1
        return 0
    return (
        (-1) ** (order - interaction_size)
        * (1 / 2) ** (moebius_size - interaction_size)
        * binom(moebius_size - interaction_size - 1, order - interaction_size)
    )