123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109 |
- """Node redundancy for bipartite graphs."""
- from itertools import combinations
- from networkx import NetworkXError
- __all__ = ["node_redundancy"]
- def node_redundancy(G, nodes=None):
- r"""Computes the node redundancy coefficients for the nodes in the bipartite
- graph `G`.
- The redundancy coefficient of a node `v` is the fraction of pairs of
- neighbors of `v` that are both linked to other nodes. In a one-mode
- projection these nodes would be linked together even if `v` were
- not there.
- More formally, for any vertex `v`, the *redundancy coefficient of `v`* is
- defined by
- .. math::
- rc(v) = \frac{|\{\{u, w\} \subseteq N(v),
- \: \exists v' \neq v,\: (v',u) \in E\:
- \mathrm{and}\: (v',w) \in E\}|}{ \frac{|N(v)|(|N(v)|-1)}{2}},
- where `N(v)` is the set of neighbors of `v` in `G`.
- Parameters
- ----------
- G : graph
- A bipartite graph
- nodes : list or iterable (optional)
- Compute redundancy for these nodes. The default is all nodes in G.
- Returns
- -------
- redundancy : dictionary
- A dictionary keyed by node with the node redundancy value.
- Examples
- --------
- Compute the redundancy coefficient of each node in a graph::
- >>> from networkx.algorithms import bipartite
- >>> G = nx.cycle_graph(4)
- >>> rc = bipartite.node_redundancy(G)
- >>> rc[0]
- 1.0
- Compute the average redundancy for the graph::
- >>> from networkx.algorithms import bipartite
- >>> G = nx.cycle_graph(4)
- >>> rc = bipartite.node_redundancy(G)
- >>> sum(rc.values()) / len(G)
- 1.0
- Compute the average redundancy for a set of nodes::
- >>> from networkx.algorithms import bipartite
- >>> G = nx.cycle_graph(4)
- >>> rc = bipartite.node_redundancy(G)
- >>> nodes = [0, 2]
- >>> sum(rc[n] for n in nodes) / len(nodes)
- 1.0
- Raises
- ------
- NetworkXError
- If any of the nodes in the graph (or in `nodes`, if specified) has
- (out-)degree less than two (which would result in division by zero,
- according to the definition of the redundancy coefficient).
- References
- ----------
- .. [1] Latapy, Matthieu, Clémence Magnien, and Nathalie Del Vecchio (2008).
- Basic notions for the analysis of large two-mode networks.
- Social Networks 30(1), 31--48.
- """
- if nodes is None:
- nodes = G
- if any(len(G[v]) < 2 for v in nodes):
- raise NetworkXError(
- "Cannot compute redundancy coefficient for a node"
- " that has fewer than two neighbors."
- )
- # TODO This can be trivially parallelized.
- return {v: _node_redundancy(G, v) for v in nodes}
- def _node_redundancy(G, v):
- """Returns the redundancy of the node `v` in the bipartite graph `G`.
- If `G` is a graph with `n` nodes, the redundancy of a node is the ratio
- of the "overlap" of `v` to the maximum possible overlap of `v`
- according to its degree. The overlap of `v` is the number of pairs of
- neighbors that have mutual neighbors themselves, other than `v`.
- `v` must have at least two neighbors in `G`.
- """
- n = len(G[v])
- overlap = sum(
- 1 for (u, w) in combinations(G[v], 2) if (set(G[u]) & set(G[w])) - {v}
- )
- return (2 * overlap) / (n * (n - 1))
|