Source code for nash.algorithms.support_enumeration

"""A class for a normal form game"""
import numpy as np
from itertools import chain, combinations


[docs]def powerset(n):
    """
    A power set of range(n)

    Based on recipe from python itertools documentation:

    https://docs.python.org/2/library/itertools.html#recipes
    """
    return chain.from_iterable(combinations(range(n), r) for r in range(n + 1))


[docs]def solve_indifference(A, rows=None, columns=None):
    """
    Solve the indifference for a payoff matrix assuming support for the
    strategies given by columns

    Finds vector of probabilities that makes player indifferent between
    rows.  (So finds probability vector for corresponding column player)

    Parameters
    ----------

        A: a 2 dimensional numpy array (A payoff matrix for the row player)
        rows: the support played by the row player
        columns: the support player by the column player

    Returns
    -------

        A numpy array:
        A probability vector for the column player that makes the row
        player indifferent. Will return False if all entries are not >= 0.
    """
    # Ensure differences between pairs of pure strategies are the same
    M = (A[np.array(rows)] - np.roll(A[np.array(rows)], 1, axis=0))[:-1]

    # Columns that must be played with prob 0
    zero_columns = set(range(A.shape[1])) - set(columns)

    if zero_columns != set():
        M = np.append(M, [[int(i == j) for i, col in enumerate(M.T)]
                          for j in zero_columns], axis=0)

    # Ensure have probability vector
    M = np.append(M, np.ones((1, M.shape[1])), axis=0)
    b = np.append(np.zeros(len(M) - 1), [1])

    try:
        prob = np.linalg.solve(M, b)
        if all(prob >= 0):
            return prob
        return False
    except np.linalg.linalg.LinAlgError:
        return False

[docs]def potential_support_pairs(A, B):
    """
    A generator for the potential support pairs

    Returns
    -------

        A generator of all potential support pairs
    """
    p1_num_strategies, p2_num_strategies = A.shape
    for support1 in (s for s in powerset(p1_num_strategies) if len(s) > 0):
        for support2 in (s for s in powerset(p2_num_strategies)
                         if len(s) == len(support1)):
            yield support1, support2

[docs]def indifference_strategies(A, B):
    """
    A generator for the strategies corresponding to the potential supports

    Returns
    -------

        A generator of all potential strategies that are indifferent on each
        potential support. Return False if they are not valid (not a
        probability vector OR not fully on the given support).
    """
    for pair in potential_support_pairs(A, B):
        s1 = solve_indifference(B.T, *(pair[::-1]))
        s2 = solve_indifference(A, *pair)

        if obey_support(s1, pair[0]) and obey_support(s2, pair[1]):
            yield s1, s2, pair[0], pair[1]

[docs]def obey_support(strategy, support):
    """
    Test if a strategy obeys its support

    Parameters
    ----------

        strategy: a numpy array
            A given strategy vector
        support: a numpy array
            A strategy support

    Returns
    -------

        A boolean: whether or not that strategy does indeed have the given
        support
    """
    if strategy is False:
        return False
    if not all((i in support and value > 0) or
               (i not in support and value <= 0)
               for i, value in enumerate(strategy)):
        return False
    return True

[docs]def is_ne(strategy_pair, support_pair, payoff_matrices):
    """
    Test if a given strategy pair is a pair of best responses

    Parameters
    ----------

        strategy_pair: a 2-tuple of numpy arrays
        support_pair: a 2-tuple of numpy arrays
    """
    A, B = payoff_matrices
    # Payoff against opponents strategies:
    u = strategy_pair[1].reshape(strategy_pair[1].size, 1)
    row_payoffs = np.dot(A, u)

    v = strategy_pair[0].reshape(strategy_pair[0].size, 1)
    column_payoffs = np.dot(B.T, v)

    # Pure payoffs on current support:
    row_support_payoffs = row_payoffs[np.array(support_pair[0])]
    column_support_payoffs = column_payoffs[np.array(support_pair[1])]

    return (row_payoffs.max() == row_support_payoffs.max() and
            column_payoffs.max() == column_support_payoffs.max())

[docs]def support_enumeration(A, B):
    """
    Obtain the Nash equilibria using support enumeration.

    Algorithm implemented here is Algorithm 3.4 of [Nisan2007]_

    1. For each k in 1...min(size of strategy sets)
    2. For each I,J supports of size k
    3. Solve indifference conditions
    4. Check that have Nash Equilibrium.

    Returns
    -------

        equilibria: A generator.
    """
    return ((s1, s2)
            for s1, s2, sup1, sup2 in indifference_strategies(A, B)
            if is_ne((s1, s2), (sup1, sup2), (A, B)))