Module `olivia.immunization`

Olivia immunization functions.

Immunization analyzes in which packages it is better to invest to protect the network as a whole.

Expand source code

"""
Olivia immunization functions.

Immunization analyzes in which packages it is better to invest to protect the network as a whole.
"""

import random

import networkx as nx

from itertools import product

from olivia.lib.graphs import removed, strong_articulation_points
from olivia.model import OliviaNetwork
from olivia.networkmetrics import failure_vulnerability
from olivia.packagemetrics import Reach, DependentsCount, Impact, Surface


def immunization_delta(net, n, cost_metric=Reach, algorithm='network'):
    """
    Compute the improvement in network vulnerability by immunizing a certain set of packages.

    Parameters
    ----------
    net: OliviaNetwork
        Input network.
    n: container
        Container of packages to be immunized.
    cost_metric: class, optional
        Metric to measure cost.
    algorithm: 'network' or 'analytic'

    Returns
    -------
    result: float
        Difference of network vulnerability after immunization of the elements in n.

    Notes
    -----
    'network' algorithm Implements the naive algorithm of removing immunized nodes and rebuilding model from scratch,
    so it is slow for big networks. Some obvious improvements could be made, but whether or not there is a
    much better alternative is an open question.
    'analytic' algorithm uses only local information pertaining transitive relations of the elements to be
    immunized. This is faster for smaller networks and/or smaller immunization sets but slower otherwise. Only
    implemented for the Reach metric.

    """
    if algorithm == 'network':
        return _immunization_delta_network(net, n, cost_metric=cost_metric)
    elif algorithm == 'analytic' and cost_metric == Reach:
        return _immunization_delta_analytic(net, n)
    else:
        raise ValueError("Not implemented.")


def _immunization_delta_network(net, n, cost_metric=Reach):
    f1 = failure_vulnerability(net, metric=cost_metric)
    size_correction = (len(net.network) - len(n)) / len(net.network)
    with removed(net.network, n):
        immunized_net = OliviaNetwork()
        immunized_net.build_model(net.network)
        f2 = failure_vulnerability(immunized_net, metric=cost_metric)
    f2 = size_correction * f2
    return f1 - f2


def _immunization_delta_analytic(net, n):
    g = net.network
    shunt = set()
    a = set()
    d = set()
    s = set()
    for node in n:
        asc = nx.ancestors(g, node)
        a.update(asc)
        desc = nx.descendants(g, node)
        d.update(desc)
        s.update(set(product(asc | {node}, desc | {node})))
    a = a - set(n)
    d = d - set(n)
    with removed(g, n):
        for ancestor in a:
            desc = nx.descendants(g, ancestor) | {ancestor}
            shunt.update({(ancestor, f) for f in desc})
    return len(s - shunt) / len(g)


def iset_naive_ranking(set_size, ms, subset=None):
    """
    Compute an immunization set by selecting top elements according to a metric.

    Parameters
    ----------
    set_size: int
        Number of packages in the immunization set.
    ms: metricStats
        Metric to measure cost.
    subset: container of nodes
        subset of packages to limit the ranking to

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    return {p[0] for p in ms.top(set_size, subset)}


def iset_delta_set_reach(olivia_model):
    """
    Compute an immunization set using the DELTA SET algorithm with the Reach metric.

    DELTA SET computes upper and lower bounds for the vulnerability reduction associated to the immunization of
    each package in the network and returns a set that is guaranteed to contain the single optimum package for
    immunization.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    delta_upper = olivia_model.get_metric(Reach) * olivia_model.get_metric(Surface)
    delta_lower = olivia_model.get_metric(Reach) + olivia_model.get_metric(Surface) - 1
    max_lower = delta_lower.top()[0][1]
    return {p for p in olivia_model if delta_upper[p] > max_lower}


def iset_delta_set_impact(olivia_model):
    """
    Compute an immunization set using the DELTA SET algorithm with the Impact metric.

    DELTA SET computes upper and lower bounds for the vulnerability reduction associated to the immunization of
    each package in the network and returns a set that is guaranteed to contain the single optimum package for
    immunization.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    delta_upper = olivia_model.get_metric(Impact) * olivia_model.get_metric(Surface)
    delta_lower = olivia_model.get_metric(DependentsCount) * olivia_model.get_metric(Surface)
    max_lower = delta_lower.top()[0][1]
    return {p for p in olivia_model if delta_upper[p] > max_lower}


def iset_sap(olivia_model, clusters=None):
    """
    Compute an immunization set detecting strong articulation points (SAP).

    Immunization of SAP in the strongly connected components (SCC) of the network can be very effective
    in networks with large SCCs.

    Large SCC play a crucial role in increasing the vulnerability of networks of dependencies. Strong articulation
    points are nodes whose removal would create additional strongly connected components, thus reducing the size of
    the larger SCC.

    The appearance of SCCs in real packet networks seems to follow a model similar to the formation of the giant
    component in Erdős-Rényi models. So the size of the largest SCC is usually much larger than the rest.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    clusters: sets of nodes
        Iterable with sets of nodes forming SCCs in the network. If None the largest SCC is detected and used.

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized corresponding to the SAP of the clusters.

    """
    if clusters is None:
        clusters = [olivia_model.sorted_clusters()[0]]
    sap = set()
    for c in clusters:
        scc = olivia_model.network.subgraph(c)
        sap.update(strong_articulation_points(scc))
    return sap


def iset_random(olivia_model, set_size, indirect=False, seed=None):
    """
    Compute an immunization set by randomly selecting packages.

    This method is useful for understanding the nature of a network's vulnerability and/or for
    establishing baseline immunization cases.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network
    set_size: int
        Number of packages in the immunization set.
    indirect: bool, optional
        Whether to use indirect selection or not. Using indirect selection the immunization set is constructed
        by randomly choosing a dependency of a randomly selected package.
    seed: int, optional
        Seed for the random number generator.

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    packages = tuple(olivia_model)
    if seed:
        random.seed(seed)
    if indirect:
        result = set()
        while len(result) != set_size:
            dependencies = []
            while len(dependencies) == 0:
                current = random.choice(packages)
                dependencies = olivia_model[current].direct_dependencies()
            result.add(random.choice(tuple(dependencies)))
        return result
    else:
        return set(random.sample(packages, k=set_size))

Functions

def immunization_delta(net, n, cost_metric=olivia.packagemetrics.Reach, algorithm='network')

Compute the improvement in network vulnerability by immunizing a certain set of packages.

Parameters

net : OliviaNetwork: Input network.
n : container: Container of packages to be immunized.
cost_metric : class, optional: Metric to measure cost.
algorithm : 'network' or 'analytic'

Returns

result : float: Difference of network vulnerability after immunization of the elements in n.

Notes

'network' algorithm Implements the naive algorithm of removing immunized nodes and rebuilding model from scratch, so it is slow for big networks. Some obvious improvements could be made, but whether or not there is a much better alternative is an open question. 'analytic' algorithm uses only local information pertaining transitive relations of the elements to be immunized. This is faster for smaller networks and/or smaller immunization sets but slower otherwise. Only implemented for the Reach metric.

Expand source code

def immunization_delta(net, n, cost_metric=Reach, algorithm='network'):
    """
    Compute the improvement in network vulnerability by immunizing a certain set of packages.

    Parameters
    ----------
    net: OliviaNetwork
        Input network.
    n: container
        Container of packages to be immunized.
    cost_metric: class, optional
        Metric to measure cost.
    algorithm: 'network' or 'analytic'

    Returns
    -------
    result: float
        Difference of network vulnerability after immunization of the elements in n.

    Notes
    -----
    'network' algorithm Implements the naive algorithm of removing immunized nodes and rebuilding model from scratch,
    so it is slow for big networks. Some obvious improvements could be made, but whether or not there is a
    much better alternative is an open question.
    'analytic' algorithm uses only local information pertaining transitive relations of the elements to be
    immunized. This is faster for smaller networks and/or smaller immunization sets but slower otherwise. Only
    implemented for the Reach metric.

    """
    if algorithm == 'network':
        return _immunization_delta_network(net, n, cost_metric=cost_metric)
    elif algorithm == 'analytic' and cost_metric == Reach:
        return _immunization_delta_analytic(net, n)
    else:
        raise ValueError("Not implemented.")

def iset_delta_set_impact(olivia_model)

Compute an immunization set using the DELTA SET algorithm with the Impact metric.

DELTA SET computes upper and lower bounds for the vulnerability reduction associated to the immunization of each package in the network and returns a set that is guaranteed to contain the single optimum package for immunization.

The resulting set size is a product of the algorithm and cannot be selected.

Parameters

olivia_model : OliviaNetwork: Input network

Returns

immunization_set : set: Set of packages to be immunized.

Expand source code

def iset_delta_set_impact(olivia_model):
    """
    Compute an immunization set using the DELTA SET algorithm with the Impact metric.

    DELTA SET computes upper and lower bounds for the vulnerability reduction associated to the immunization of
    each package in the network and returns a set that is guaranteed to contain the single optimum package for
    immunization.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    delta_upper = olivia_model.get_metric(Impact) * olivia_model.get_metric(Surface)
    delta_lower = olivia_model.get_metric(DependentsCount) * olivia_model.get_metric(Surface)
    max_lower = delta_lower.top()[0][1]
    return {p for p in olivia_model if delta_upper[p] > max_lower}

def iset_delta_set_reach(olivia_model)

Compute an immunization set using the DELTA SET algorithm with the Reach metric.

The resulting set size is a product of the algorithm and cannot be selected.

Parameters

olivia_model : OliviaNetwork: Input network

Returns

immunization_set : set: Set of packages to be immunized.

Expand source code

def iset_delta_set_reach(olivia_model):
    """
    Compute an immunization set using the DELTA SET algorithm with the Reach metric.

    DELTA SET computes upper and lower bounds for the vulnerability reduction associated to the immunization of
    each package in the network and returns a set that is guaranteed to contain the single optimum package for
    immunization.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    delta_upper = olivia_model.get_metric(Reach) * olivia_model.get_metric(Surface)
    delta_lower = olivia_model.get_metric(Reach) + olivia_model.get_metric(Surface) - 1
    max_lower = delta_lower.top()[0][1]
    return {p for p in olivia_model if delta_upper[p] > max_lower}

def iset_naive_ranking(set_size, ms, subset=None)

Compute an immunization set by selecting top elements according to a metric.

Parameters

set_size : int: Number of packages in the immunization set.
ms : metricStats: Metric to measure cost.
subset : container of nodes: subset of packages to limit the ranking to

Returns

immunization_set : set: Set of packages to be immunized.

Expand source code

def iset_naive_ranking(set_size, ms, subset=None):
    """
    Compute an immunization set by selecting top elements according to a metric.

    Parameters
    ----------
    set_size: int
        Number of packages in the immunization set.
    ms: metricStats
        Metric to measure cost.
    subset: container of nodes
        subset of packages to limit the ranking to

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    return {p[0] for p in ms.top(set_size, subset)}

def iset_random(olivia_model, set_size, indirect=False, seed=None)

Compute an immunization set by randomly selecting packages.

This method is useful for understanding the nature of a network's vulnerability and/or for establishing baseline immunization cases.

Parameters

olivia_model : OliviaNetwork: Input network
set_size : int: Number of packages in the immunization set.
indirect : bool, optional: Whether to use indirect selection or not. Using indirect selection the immunization set is constructed by randomly choosing a dependency of a randomly selected package.
seed : int, optional: Seed for the random number generator.

Returns

immunization_set : set: Set of packages to be immunized.

Expand source code

def iset_random(olivia_model, set_size, indirect=False, seed=None):
    """
    Compute an immunization set by randomly selecting packages.

    This method is useful for understanding the nature of a network's vulnerability and/or for
    establishing baseline immunization cases.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network
    set_size: int
        Number of packages in the immunization set.
    indirect: bool, optional
        Whether to use indirect selection or not. Using indirect selection the immunization set is constructed
        by randomly choosing a dependency of a randomly selected package.
    seed: int, optional
        Seed for the random number generator.

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized.

    """
    packages = tuple(olivia_model)
    if seed:
        random.seed(seed)
    if indirect:
        result = set()
        while len(result) != set_size:
            dependencies = []
            while len(dependencies) == 0:
                current = random.choice(packages)
                dependencies = olivia_model[current].direct_dependencies()
            result.add(random.choice(tuple(dependencies)))
        return result
    else:
        return set(random.sample(packages, k=set_size))

def iset_sap(olivia_model, clusters=None)

Compute an immunization set detecting strong articulation points (SAP).

Immunization of SAP in the strongly connected components (SCC) of the network can be very effective in networks with large SCCs.

Large SCC play a crucial role in increasing the vulnerability of networks of dependencies. Strong articulation points are nodes whose removal would create additional strongly connected components, thus reducing the size of the larger SCC.

The appearance of SCCs in real packet networks seems to follow a model similar to the formation of the giant component in Erdős-Rényi models. So the size of the largest SCC is usually much larger than the rest.

The resulting set size is a product of the algorithm and cannot be selected.

Parameters

olivia_model : OliviaNetwork: Input network
clusters : sets of nodes: Iterable with sets of nodes forming SCCs in the network. If None the largest SCC is detected and used.

Returns

immunization_set : set: Set of packages to be immunized corresponding to the SAP of the clusters.

Expand source code

def iset_sap(olivia_model, clusters=None):
    """
    Compute an immunization set detecting strong articulation points (SAP).

    Immunization of SAP in the strongly connected components (SCC) of the network can be very effective
    in networks with large SCCs.

    Large SCC play a crucial role in increasing the vulnerability of networks of dependencies. Strong articulation
    points are nodes whose removal would create additional strongly connected components, thus reducing the size of
    the larger SCC.

    The appearance of SCCs in real packet networks seems to follow a model similar to the formation of the giant
    component in Erdős-Rényi models. So the size of the largest SCC is usually much larger than the rest.

    The resulting set size is a product of the algorithm and cannot be selected.

    Parameters
    ----------
    olivia_model: OliviaNetwork
        Input network

    clusters: sets of nodes
        Iterable with sets of nodes forming SCCs in the network. If None the largest SCC is detected and used.

    Returns
    -------
    immunization_set: set
        Set of packages to be immunized corresponding to the SAP of the clusters.

    """
    if clusters is None:
        clusters = [olivia_model.sorted_clusters()[0]]
    sap = set()
    for c in clusters:
        scc = olivia_model.network.subgraph(c)
        sap.update(strong_articulation_points(scc))
    return sap