Source code for pref_voting.generate_weighted_majority_graphs

'''
    File: generate_margin_graphs.py
    Author: Wes Holliday (wesholliday@berkeley.edu) and Eric Pacuit (epacuit@umd.edu)
    Date: July 14, 2022
    Updated: December 19, 2022
    
    Functions to generate a margin graph
    
'''


import networkx as nx
from itertools import combinations
from pref_voting.weighted_majority_graphs import MarginGraph
import numpy as np
from scipy.stats import multivariate_normal

[docs] def generate_edge_ordered_tournament(num_cands, parity="even"): """Generate a random uniquely weighted MarginGraph for ``num_cands`` candidates. :param num_cands: the number of candidates :type num_cands: int :returns: a uniquely weighted margin graph :rtype: MarginGraph .. note:: This function randomly generates a tournament with a linear order over the edges. A **tournament** is an asymmetric directed graph with an edge between every two nodes. The linear order of the edges is represented by assigning to each edge a number :math:`2, \ldots, 2*n`, where :math:`n` is the number of the edges. """ assert parity in ["even", "odd"], "The parity should be either 'even' or 'odd'." mg = nx.DiGraph() mg.add_nodes_from(list(range(num_cands))) candidates = list(range(num_cands)) _edges = list() for c1 in candidates: for c2 in candidates: if c1 != c2: if (c1, c2) not in _edges and (c2, c1) not in _edges: if np.random.choice([True, False]): _edges.append((c1, c2)) else: _edges.append((c2, c1)) edges = list() edge_indices = list(range(len(_edges))) np.random.shuffle(edge_indices) for i, e_idx in enumerate(edge_indices): edges.append((_edges[e_idx][0], _edges[e_idx][1], 2 * (i+1) if parity == 'even' else 2 * i+1)) return MarginGraph(candidates, edges)
[docs] def generate_margin_graph(num_cands, weight_domain = None, parity = 'even'): """Generate a random MarginGraph (allowing for ties in the margins) for ``num_cands`` candidates. Args: num_cands (int): the number of candidates Returns: MarginGraph """ assert parity in ['even', 'odd'], "Parity must be 'even' or 'odd'." assert weight_domain is None or isinstance(weight_domain, list) and len(weight_domain) > 0, "The weight_domain must be a list with at least one element." candidates = list(range(num_cands)) edges = list() pairs_of_cands = list(combinations(candidates, 2)) if weight_domain is None and parity == 'even': weight_domain = [2 * pidx for pidx in range(len(pairs_of_cands) + 1)] elif weight_domain is None and parity == 'odd': weight_domain = [2 * pidx + 1 for pidx in range(len(pairs_of_cands) + 1)] # for c1, c2 in pairs_of_cands: margin = np.random.choice(weight_domain) if margin != 0: if np.random.choice([True, False]): edges.append((c1, c2, margin)) else: edges.append((c2, c1, margin)) return MarginGraph(candidates, edges)
[docs] def generate_margin_graph_bradley_terry(num_cands, num_voters, score_prob_mod = lambda c: np.random.uniform(0,1)): """Generates a margin graph for num_cands candidates by first sampling candidate scores from score_prob_mod and then sampling votes from the Bradley-Terry model using the sampled scores. Args: num_cands (int): Number of candidates num_voters (int): Number of voters score_prob_mod (function, optional): A function that takes a candidate and returns a score. Defaults to lambda c: np.random.uniform(0,1). Returns: MarginGraph: A margin graph """ candidates = list(range(num_cands)) pairs_of_cands = list(combinations(candidates, 2)) cand_score = dict() for c in candidates: cand_score[c] = score_prob_mod(c) edges = list() for c1, c2 in pairs_of_cands: support_c1_c2 = 0 support_c2_c1 = 0 for n in range(num_voters): vote = np.random.choice([1,0], p = [cand_score[c1] / (cand_score[c1] + cand_score[c2]), cand_score[c2] / (cand_score[c1] + cand_score[c2])]) if vote == 1: support_c1_c2 += 1 else: support_c2_c1 += 1 if support_c1_c2 > support_c2_c1: edges.append((c1,c2, support_c1_c2 - support_c2_c1)) if support_c2_c1 > support_c1_c2: edges.append((c2,c1, support_c2_c1 - support_c1_c2)) return MarginGraph(candidates, edges)
### # Turn a code into a pair def depair(pair_vector, k): return pair_vector[k] # This function defines the i,jth entry of the covariance matrix def entries(pair_vector, i,j): x = depair(pair_vector, i) y = depair(pair_vector, j) if x[0] == y[0] and x[1] == y[1]: return 1 if x[1] == y[0]: return -1/3 if x[1] == y[1]: return 1/3 if x[0] == y[0]: return 1/3 if x[0] == y[1]: return -1/3 return 0 def generate_covariance_matrix(num_candidates): num_pairs = num_candidates *(num_candidates -1)//2 # Store the vector mapping codes to pairs pair_vector = [0]*num_pairs # Populate the vector of pairs k=0 for i in range(num_candidates): for j in range(i+1,num_candidates): pair_vector[k] = [i,j] k = k+1 # Populate the covariance matrix cov = np.empty((num_pairs,num_pairs)) for i in range(num_pairs): for j in range(num_pairs): cov[i,j] = entries(pair_vector, i,j) return cov
[docs] def generate_edge_ordered_tournament_infinite_limit(num_candidates, cov_matrix = None): """ Using the ideas from Section 9 of the paper *An Analysis of Random Elections with Large Numbers of Voters* by Matthew Harrison-Trainor (https://arxiv.org/abs/2009.02979) and the code provided at https://github.com/MatthewHT/RandomMarginGraphs/, generate a qualitative margin graph for ``num_candidates`` candidates. .. important:: The weights of the generated margin graphs are real numbers, representing a linear ordering of the edges. Only qualitative margin graph invariant voting methods, such as Split Cycle, Beat Path, Minimax, Ranked Pairs, etc., should be used on the generated graphs. Args: num_candidates (int): the number of candidates Returns: MarginGraph """ candidates = range(num_candidates) cov_matrix = cov_matrix if cov_matrix is not None else generate_covariance_matrix(num_candidates) # random_var is a random variable with the multivariate normal distribution of margin graphs random_var = multivariate_normal(None, cov_matrix) rv = random_var.rvs() def pair(p): return p[1]-2*p[0]-1 + (num_candidates)*(num_candidates+1)//2 - (num_candidates-p[0])*(num_candidates-p[0]+1)//2 mg = [[-np.inf for _ in candidates] for _ in candidates] for c1 in candidates: for c2 in candidates: if (c1 < c2 and rv[pair([c1,c2])] > 0): mg[c1][c2] = rv[pair([c1,c2])] if (c1 > c2 and rv[pair([c2,c1])] < 0): mg[c1][c2] = -rv[pair([c2,c1])] if (c1 == c2): mg[c1][c2] = 0 w_edges = [(c1, c2, mg[c1][c2]) for c1 in candidates for c2 in candidates if c1 != c2 if mg[c1][c2] > 0] return MarginGraph(candidates, w_edges)
## Generating Canonical MarginGraphs def _enumerate_ceots(num_cands, num_edges, partial_ceot, used_nodes, next_node): # Given a partial ceot P, we can extend it with any new edge (A,B) satisfying one of the following conditions: # 1. A and B have both already been used in edges in P, but neither (A,B) nor (B,A) is in P; # 2. A has already been used in an edge in P, and B is the next integer after the largest integer in an edge in P. # 3. A is the next integer after the largest integer in an edge in P, and B has already been used in an edge in P; # 4. A is the next integer after the largest integer in an edge in P, and B is the next integer after A. if len(partial_ceot) == num_edges: yield partial_ceot if len(partial_ceot) < num_edges: if next_node == num_cands: available_nodes = used_nodes if next_node < num_cands: available_nodes = used_nodes + [next_node] for n in available_nodes: if n == next_node and next_node < num_cands - 1: # If n == next_node, we are in Case 3 or Case 4 above available_nodes = used_nodes + [next_node + 1] for m in available_nodes: if not n==m and not (n,m) in partial_ceot and not (m,n) in partial_ceot: new_ceot = [edge for edge in partial_ceot] + [(n,m)] if not (n == next_node or m == next_node): # Then we are in Case 1 above yield from _enumerate_ceots(num_cands,num_edges,new_ceot,used_nodes,next_node) if (n == next_node or m == next_node) and not m == next_node + 1: # Then we are in Case 2 or 3 above new_used_nodes = list(set(used_nodes + [n,m])) new_next_node = next_node + 1 yield from _enumerate_ceots(num_cands,num_edges,new_ceot,new_used_nodes,new_next_node) if m == next_node + 1: # Then we are in Case 4 above new_used_nodes = list(set(used_nodes + [n,m])) new_next_node = next_node + 2 yield from _enumerate_ceots(num_cands,num_edges,new_ceot,new_used_nodes,new_next_node) def _enumerate_ceots_as_edgelist(num_cands): num_edges = (num_cands * (num_cands -1))//2 partial_ceot = [(0,1)] used_nodes = [0,1] next_node = 2 yield from _enumerate_ceots(num_cands,num_edges,partial_ceot,used_nodes,next_node)
[docs] def enumerate_canonical_edge_ordered_tournaments(num_cands, parity = "even"): """ A *canonical* edge-ordered tournament (ceot) is a representative from an isomorphism class of linearly edge-ordered tournaments. Enumerate all ceots for ``num_cands`` candidates, representing a ceot as a ``MarginGraph`` where the margins represent the linear order of the edges. Args: num_cands (int): the number of candidates parity (str, optional): The parity of the margins, either 'even' or 'odd'. Returns: A generator of ``MarginGraph`` for ``num_candidates`` .. warning:: It is only feasible to run this function for up to 5 candidates. """ assert parity in ["odd", "even"], "parity must be either 'odd' or 'even'" for ceot in _enumerate_ceots_as_edgelist(num_cands): yield MarginGraph(list(range(num_cands)), [(e[0], e[1], 2 * (eidx + 1) if parity == "even" else 2 * eidx + 1) for eidx, e in enumerate(reversed(ceot))])
def sublists(lst, length, x = None, partial_sublist = None): x = length if x is None else x partial_sublist = list() if partial_sublist is None else partial_sublist if len(partial_sublist) == length: yield partial_sublist for i,el in enumerate(lst): if i < x: extended_partial_sublist = partial_sublist + [el] x += 1 yield from sublists(lst[i+1::], length, x, extended_partial_sublist)
[docs] def enumerate_uniquely_weighted_margin_graphs(num_cands, weight_domain): """ Enumerate all representatives from isomorphism classes of margin graphs with weights drawn from ``weight_domain``. Args: num_cands (int): the number of candidates weight_domain (List[int]): The list of weights in the margin graph. Returns: A generator of ``MarginGraph`` for ``num_candidates`` .. warning:: It is only feasible to run this function for up to 5 candidates. """ weight_domain = sorted(weight_domain) num_edges = (num_cands * (num_cands - 1)) // 2 for ceot in _enumerate_ceots_as_edgelist(num_cands): for weight_list in sublists(weight_domain, num_edges): yield MarginGraph(list(range(num_cands)), [(e[0], e[1], weight_list[eidx]) for eidx, e in enumerate(reversed(ceot))])