111 lines
3.4 KiB
Python
111 lines
3.4 KiB
Python
"""Node redundancy for bipartite graphs."""
|
|
from itertools import combinations
|
|
|
|
from networkx import NetworkXError
|
|
|
|
__all__ = ["node_redundancy"]
|
|
|
|
|
|
def node_redundancy(G, nodes=None):
|
|
r"""Computes the node redundancy coefficients for the nodes in the bipartite
|
|
graph `G`.
|
|
|
|
The redundancy coefficient of a node `v` is the fraction of pairs of
|
|
neighbors of `v` that are both linked to other nodes. In a one-mode
|
|
projection these nodes would be linked together even if `v` were
|
|
not there.
|
|
|
|
More formally, for any vertex `v`, the *redundancy coefficient of `v`* is
|
|
defined by
|
|
|
|
.. math::
|
|
|
|
rc(v) = \frac{|\{\{u, w\} \subseteq N(v),
|
|
\: \exists v' \neq v,\: (v',u) \in E\:
|
|
\mathrm{and}\: (v',w) \in E\}|}{ \frac{|N(v)|(|N(v)|-1)}{2}},
|
|
|
|
where `N(v)` is the set of neighbors of `v` in `G`.
|
|
|
|
Parameters
|
|
----------
|
|
G : graph
|
|
A bipartite graph
|
|
|
|
nodes : list or iterable (optional)
|
|
Compute redundancy for these nodes. The default is all nodes in G.
|
|
|
|
Returns
|
|
-------
|
|
redundancy : dictionary
|
|
A dictionary keyed by node with the node redundancy value.
|
|
|
|
Examples
|
|
--------
|
|
Compute the redundancy coefficient of each node in a graph::
|
|
|
|
>>> from networkx.algorithms import bipartite
|
|
>>> G = nx.cycle_graph(4)
|
|
>>> rc = bipartite.node_redundancy(G)
|
|
>>> rc[0]
|
|
1.0
|
|
|
|
Compute the average redundancy for the graph::
|
|
|
|
>>> from networkx.algorithms import bipartite
|
|
>>> G = nx.cycle_graph(4)
|
|
>>> rc = bipartite.node_redundancy(G)
|
|
>>> sum(rc.values()) / len(G)
|
|
1.0
|
|
|
|
Compute the average redundancy for a set of nodes::
|
|
|
|
>>> from networkx.algorithms import bipartite
|
|
>>> G = nx.cycle_graph(4)
|
|
>>> rc = bipartite.node_redundancy(G)
|
|
>>> nodes = [0, 2]
|
|
>>> sum(rc[n] for n in nodes) / len(nodes)
|
|
1.0
|
|
|
|
Raises
|
|
------
|
|
NetworkXError
|
|
If any of the nodes in the graph (or in `nodes`, if specified) has
|
|
(out-)degree less than two (which would result in division by zero,
|
|
according to the definition of the redundancy coefficient).
|
|
|
|
References
|
|
----------
|
|
.. [1] Latapy, Matthieu, Clémence Magnien, and Nathalie Del Vecchio (2008).
|
|
Basic notions for the analysis of large two-mode networks.
|
|
Social Networks 30(1), 31--48.
|
|
|
|
"""
|
|
if nodes is None:
|
|
nodes = G
|
|
if any(len(G[v]) < 2 for v in nodes):
|
|
raise NetworkXError(
|
|
"Cannot compute redundancy coefficient for a node"
|
|
" that has fewer than two neighbors."
|
|
)
|
|
# TODO This can be trivially parallelized.
|
|
return {v: _node_redundancy(G, v) for v in nodes}
|
|
|
|
|
|
def _node_redundancy(G, v):
|
|
"""Returns the redundancy of the node `v` in the bipartite graph `G`.
|
|
|
|
If `G` is a graph with `n` nodes, the redundancy of a node is the ratio
|
|
of the "overlap" of `v` to the maximum possible overlap of `v`
|
|
according to its degree. The overlap of `v` is the number of pairs of
|
|
neighbors that have mutual neighbors themselves, other than `v`.
|
|
|
|
`v` must have at least two neighbors in `G`.
|
|
|
|
"""
|
|
n = len(G[v])
|
|
# TODO On Python 3, we could just use `G[u].keys() & G[w].keys()` instead
|
|
# of instantiating the entire sets.
|
|
overlap = sum(
|
|
1 for (u, w) in combinations(G[v], 2) if (set(G[u]) & set(G[w])) - {v}
|
|
)
|
|
return (2 * overlap) / (n * (n - 1))
|