Source code for socialchoicekit.utils

import numpy as np
from typing import Dict, List, Union

[docs]def check_profile(
  profile: np.ndarray,
  is_complete: bool = True,
  is_strict: bool = True,
) -> None:
  """
  Checks that the profile is a numpy array with the correct dimensions.

  Parameters
  ----------
  profile: np.ndarray
    This is the ordinal profile. A (N, M) array, where N is the number of agents and M is the number of alternatives or items. The element at (i, j) indicates the agent's preference for alternative j, where 1 is the most preferred alternative.

  is_complete: bool
    If True, the profile does not have any NaN values. If False, the profile has NaN values. True by default.

  is_strict: bool
    If True, the profile does not allow ties. If False, the profile allows ties. True by default.

  Raises
  ------
  ValueError
    If the profile is not a numpy array
    If the profile is not two-dimensional.
    If the profile contains NaN values.
    If the profile contains values other than integers from 1 to M.
  """
  if isinstance(profile, np.ndarray):
    if np.ndim(profile) == 2:
      if is_complete and np.isnan(np.sum(profile)):
        raise ValueError("Profile cannot contain NaN values")
      if np.nanmin(profile) == 1:
        if not is_complete or not is_strict or np.nanmax(profile) == profile.shape[1]:
          return
      raise ValueError("Profile must contain exactly integers from 1 to M")
    raise ValueError("Profile must be a two-dimensional array")
  raise ValueError("Profile is not in a recognized data format")

[docs]def check_valuation_profile(
    valuation_profile: np.ndarray,
    is_complete: bool = False
  ) -> None:
  """
  Checks that the valuation profile is a numpy array with the correct dimensions.

  Parameters
  ----------
    valuation_profile: np.ndarray
      This is the (partial) cardinal profile. A (N, M) array, where N is the number of agents and M is the number of alternatives or items. The element at (i, j) indicates the utility value (agent's cardinal preference) for alternative or item j. If the value is unknown, the element would be NaN.

    is_complete: bool
      If True, the valuation profile does not have any NaN values. If False, the valuation profile has NaN values. False by default.
  """
  if isinstance(valuation_profile, np.ndarray):
    if np.ndim(valuation_profile) == 2:
      if is_complete and np.isnan(np.sum(valuation_profile)):
        raise ValueError("Valuation profile cannot contain NaN values")
      return
    raise ValueError("Profile must be a two-dimensional array")
  raise ValueError("Profile is not in a recognized data format")

[docs]def check_square_matrix(matrix: np.ndarray) -> None:
  """
  Checks that the matrix is a numpy array that represents a square matrix.

  Parameters
  ----------
  matrix: np.ndarray
    This is the matrix to check. An (M, M) array.

  Raises
  ------
  ValueError
    If the matrix is not a numpy array
    If the matrix is not two-dimensional.
    If the matrix is not square.
  """
  if isinstance(matrix, np.ndarray):
    if np.ndim(matrix) == 2:
      if matrix.shape[0] == matrix.shape[1]:
        return
      raise ValueError("Matrix must be square")
    raise ValueError("Matrix must be a two-dimensional array")
  raise ValueError("Matrix is not in a recognized data format")

[docs]def check_graph(G: Dict[int, List[int]]) -> None:
  """
  Checks that a dictionary represents a graph.

  Parameters
  ----------
  G : Dict[int, List[int]]
    A dictionary of the form {i: [j, k, ...]} where i is the index of a vertex and [j, k, ...] are the indices of the vertices that i is connected to.
    The graph may be directed or undirected.

  Raises
  ------
  ValueError
    If the graph is not a dictionary.
    If the graph is not two-dimensional.
    If the graph contains NaN values.
    If the graph contains values other than integers.
  """
  if isinstance(G, dict):
    if all(isinstance(i, int) for i in G.keys()):
      if all(isinstance(i, list) for i in G.values()):
        for l in G.values():
          if all([i in G.keys() for i in l]):
            return
          raise ValueError("Vertices can only be linked to other vertices")
      raise ValueError("Graph must contain lists as values")
    raise ValueError("Graph must contain integers as keys")
  raise ValueError("Graph is not in a recognized data format")

[docs]def check_bipartite_graph(G: Dict[int, List[int]], X: list, Y: list) -> None:
  """
  Checks that a dictionary represents a bipartite graph.

  Parameters
  ----------
  G : Dict[int, List[int]]
    A dictionary of the form {i: [j, k, ...]} where i is the index of a vertex and [j, k, ...] are the indices of the vertices that i is connected to.
    The graph may be directed or undirected. If it is directed, then the edges are assumed to be directed from X to Y.

  X: list
    The list of the left vertices (in the first partition) in the bipartite graph G.

  Y: list
    The list of the right vertices (in the second partition) in the bipartite graph G.

  Raises
  ------
  ValueError
    If the graph is not bipartite.
  """
  check_graph(G)
  if set(X + Y) == set(G.keys()):
    for e in X:
      if e in Y:
        raise ValueError("Graph is not bipartite")
      if all([y in Y for y in G[e]]):
        return
      raise ValueError("Graph is not bipartite")
    for e in Y:
      if all([x in X for x in G[e]]):
        return
      raise ValueError("Graph is not bipartite")
  raise ValueError("Supplied X and/or Y are not consistent with the keys of the dictionary")

[docs]def check_tie_breaker(
  tie_breaker: str,
  include_accept: bool = True
) -> None:
  """
  Checks that the tie breaker is valid.

  Parameters
  ----------
  tie_breaker : {"random", "first", "accept"}
    The tie breaker to check.
    - "random": pick from a uniform distribution among the losers to drop
    - "first": pick the alternative with the lowest index
    - "accept": return all winners in an array

  include_accept : bool
    If True, "accept" is a valid tie breaker. If False, "accept" is not a valid tie breaker.

  Raises
  ------
  ValueError
    If the tie breaker is not recognized.
  """
  if tie_breaker in ["random", "first"]:
    return
  if include_accept and tie_breaker in ["accept"]:
    return
  raise ValueError("Tie breaker is not recognized")

[docs]def break_tie(
  alternatives: np.ndarray,
  tie_breaker: str = "random",
  include_accept: bool = True
) -> Union[np.ndarray, int]:
  """
  Breaks a tie among winning alternatives according to the tie breaker.

  Parameters
  ----------
  alternatives : np.ndarray
    The alternatives that are tied.

  tie_breaker : {"random", "first", "accept"}
    The tie breaker to use.
    - "random": pick from a uniform distribution among the losers to drop
    - "first": pick the alternative with the lowest index
    - "accept": return all winners in an array

  include_accept : bool
    If True, "accept" is a valid tie breaker. If False, "accept" is not a valid tie breaker.
  """
  if tie_breaker == "random":
    return np.random.choice(alternatives)
  elif tie_breaker == "first":
    return alternatives[0]
  elif tie_breaker == "accept" and include_accept:
    return alternatives
  else:
    raise ValueError("Tie breaker is not recognized")