Source code for grape.fault_diagnosis

"""FaultDiagnosis module"""

import logging
import sys
import warnings
import multiprocessing as mp
import random
import networkx as nx
import numpy as np
import pandas as pd
from deap import base, creator, tools

from .utils import chunk_it
from .general_graph import GeneralGraph
from .parallel_general_graph import ParallelGeneralGraph

warnings.simplefilter(action='ignore', category=FutureWarning)
logging.basicConfig(stream=sys.stdout, level=logging.DEBUG)


class FaultDiagnosis():
    """
    Class FaultDiagnosis.

    Perturbation of a GeneralGraph object.
    Perturbation can be simulated on a list of elements.
    From one element, the perturbation propagates in all directions,
    unless an isolating element is present.
    """
    def __init__(self, filename, parallel=False):
        """
        Create an input graph, with the structure contained in the input
        file.

        :param str filename: input file in CSV format.
        :param parallel: flag for parallel graph creation, default to False.
        :type parallel: bool, optional
        """
        if parallel:
            self.G = ParallelGeneralGraph()
        else:
            self.G = GeneralGraph()

        self.df, self.edges_df = self.G.load(filename)
        self.paths_df = None
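    # Usage sketch, assuming an input file 'graph.csv' (placeholder name)
    # in the CSV format expected by GeneralGraph.load():
    #
    #     F = FaultDiagnosis('graph.csv')                     # serial load
    #     F_par = FaultDiagnosis('graph.csv', parallel=True)  # parallel load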
    def check_input_with_gephi(self):
        """
        Write the list of nodes and the list of edges to CSV files,
        to visualize the input with Gephi.
        """
        gephi_nodes_df = self.df.reset_index()
        gephi_nodes_df.rename(columns={'index': 'mark'}, inplace=True)

        fields = ['mark', 'description', 'init_status']

        cols_to_str = ['init_status']
        gephi_nodes_df[cols_to_str] = gephi_nodes_df[cols_to_str].astype(str)
        conversions = {'nan': '', '1.0': '1', '0.0': '0'}
        gephi_nodes_df['init_status'].replace(to_replace=conversions,
                                              inplace=True)
        gephi_nodes_df[fields].to_csv('check_import_nodes.csv', index=False)

        orphans = self.edges_df['father_mark'].str.contains('NULL')
        self.edges_df = self.edges_df[~orphans]
        self.edges_df.to_csv('check_import_edges.csv', index=False)
    def fitness_iteration_parallel(self, out_queue, ichunk, chunk_length,
                                   individuals, perturbed_nodes,
                                   initial_condition):
        """
        Parallel iteration for fitness evaluation. We append to the
        multiprocessing queue a tuple constituted by the index of the
        individual, the individual itself, and its fitness.

        :param multiprocessing.queues.Queue out_queue: multiprocessing queue.
        :param int ichunk: index of the chunk under consideration.
        :param int chunk_length: length of the chunks (the last chunk may be
            shorter due to non-even division of the number of individuals by
            the number of processors).
        :param list individuals: list of individuals on which to perform
            fitness evaluation.
        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param dict initial_condition: initial status (boolean) for the
            graph switches.
        """
        for idx, item in enumerate(individuals):
            ind_fit = (ichunk * chunk_length + idx, item,
                       self.fitness_evaluation(item, perturbed_nodes,
                                               initial_condition))
            out_queue.put(ind_fit)
    def fitness_evaluation_parallel(self, pop, perturbed_nodes,
                                    initial_condition):
        """
        Wrapper for fitness evaluation. This method spawns the processes for
        fitness evaluation and collects the results.

        :param list pop: list of individuals.
        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param dict initial_condition: initial status (boolean) for the
            graph switches.

        :return: list of tuples constituted by the index of the individual,
            the individual itself, and its fitness.
        :rtype: list
        """
        n_procs = mp.cpu_count()
        fitnesses_tuples = []
        out_queue = mp.Queue()

        ind_chunks = chunk_it(pop, n_procs)

        processes = [
            mp.Process(target=self.fitness_iteration_parallel,
                       args=(out_queue, p, len(ind_chunks[0]), ind_chunks[p],
                             perturbed_nodes, initial_condition))
            for p in range(n_procs)
        ]

        for proc in processes:
            proc.start()

        while True:
            running = any(p.is_alive() for p in processes)
            while not out_queue.empty():
                fitnesses_tuples.append(out_queue.get())
            if not running:
                break

        return fitnesses_tuples
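    # Illustration of the index bookkeeping above, assuming chunk_it(lst, n)
    # splits lst into n near-equal chunks (e.g. chunk_it([a, b, c, d, e], 2)
    # -> [[a, b, c], [d, e]]). Each worker tags every result with the global
    # index ichunk*chunk_length + idx, so the caller can restore the original
    # population order with a plain sort:
    #
    #     res = fd.fitness_evaluation_parallel(pop, nodes, init_cond)
    #     res.sort(key=lambda x: x[0])       # re-align with pop ordering
    #     fitnesses = [x[2] for x in res]    # drop index and individual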
    def fitness_evaluation(self, individual, perturbed_nodes,
                           initial_condition):
        """
        Evaluation of fitness on an individual. The individual is a list of
        conditions for the graph switches (True or False). Edges connecting
        a switch's predecessors are removed if the switch state is set to
        'False'.

        :param list individual: element on which to compute the fitness.
        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param dict initial_condition: initial status (boolean) for the
            graph switches.

        :return: tuple with the number of switch changes, the total final
            service, the final graph size, the number of users with non-zero
            service, and the total distance from the average service.
        :rtype: tuple
        """
        acts = np.sum(np.not_equal(list(initial_condition.values()),
                                   individual))

        T = GeneralGraph()
        T.add_nodes_from(self.G)
        for (u, v, d) in self.G.edges(data=True):
            T.add_edge(u, v, weight=d['weight'])
        nx.set_node_attributes(T, self.G.initial_service,
                               name='initial_service')
        nx.set_node_attributes(T, self.G.type, name='type')

        for switch, status in zip(initial_condition.keys(), individual):
            if not status:
                for pred in list(T.predecessors(switch)):
                    T.remove_edge(pred, switch)

        for node in perturbed_nodes:
            if node in T.nodes():
                _, broken_nodes = self.rm_nodes(node, T)
                broken_nodes = list(set(broken_nodes))
                for n in broken_nodes:
                    T.remove_node(n)

        serv_at_usr = {key: T.service[key] for key in T.users}
        usr_with_serv = {key: serv_at_usr[key] for key in serv_at_usr.keys()
                         if serv_at_usr[key] > 0.0}

        avg_service = sum(T.service.values())
        if len(usr_with_serv.keys()) != 0:
            avg_service /= len(usr_with_serv.keys())
        dist_from_avg = {k: abs(v - avg_service)
                         for k, v in usr_with_serv.items()}

        return (acts, sum(T.service.values()), len(T),
                len(usr_with_serv.keys()), sum(dist_from_avg.values()))
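    # Worked example: the optimizer scalarizes the returned 5-tuple with a
    # dot product against the weights, so with the default weights
    # w = (1.0, -1.0, -1.0, -1.0, 2.0) and a hypothetical fitness
    # f = (2, 10.0, 8, 4, 0.5):
    #
    #     np.dot(w, f) = 2*1.0 - 10.0 - 8 - 4 + 0.5*2.0 = -19.0
    #
    # Lower values are better, since FitnessMin minimizes the scalar.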
    def optimizer(self, perturbed_nodes, initial_condition, params, weights,
                  parallel):
        """
        Genetic algorithm to optimize switch conditions, using DEAP.

        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param dict initial_condition: initial status (boolean) for the
            graph switches.
        :param dict params: values for the optimizer evolutionary algorithm.
            Dict of: {str: int, str: int, str: float, str: float, str: int}:

            - 'npop': number of individuals for each population
              (default to 300)
            - 'ngen': total number of generations (default to 100)
            - 'indpb': independent probability for attributes to be changed
              (default to 0.6)
            - 'tresh': threshold for applying crossover/mutation
              (default to 0.5)
            - 'nsel': number of individuals to select (default to 5)

        :param dict weights: weights for fitness evaluation on individuals.
            Dict of: {str: float, str: float, str: float, str: float,
            str: float}:

            - 'w1': weight multiplying the number of switch flips
              (default to 1.0)
            - 'w2': weight multiplying the total final service
              (default to -1.0)
            - 'w3': weight multiplying the final graph size
              (default to -1.0)
            - 'w4': weight multiplying the number of users with non-zero
              service (default to -1.0)
            - 'w5': weight for service balance over users (default to 2.0)

        :param bool parallel: flag for parallel fitness evaluation of the
            initial population.
        """
        logging.getLogger().setLevel(logging.INFO)

        w = np.asarray(list(weights.values()))

        creator.create("FitnessMin", base.Fitness, weights=(-1.0,))
        creator.create("Individual", list, fitness=creator.FitnessMin)

        toolbox = base.Toolbox()

        # Attribute generator
        toolbox.register("attribute_bool", random.choice, [True, False])

        # Structure initializers
        toolbox.register("individual", tools.initRepeat, creator.Individual,
                         toolbox.attribute_bool, len(self.G.switches))
        toolbox.register("population", tools.initRepeat, list,
                         toolbox.individual)

        toolbox.register("evaluate", self.fitness_evaluation)
        toolbox.register("mate", tools.cxUniform, indpb=params['indpb'])
        toolbox.register("mutate", tools.mutFlipBit, indpb=params['indpb'])

        pop = toolbox.population(n=params['npop'])

        # Evaluate the entire population
        if (not parallel) or (len(pop) < mp.cpu_count()):
            fitnesses = [toolbox.evaluate(ind, perturbed_nodes,
                                          initial_condition) for ind in pop]
        else:
            res_par = self.fitness_evaluation_parallel(pop, perturbed_nodes,
                                                       initial_condition)
            res_par.sort(key=lambda x: x[0])
            fitnesses = [x[2] for x in res_par]

        for ind, f in zip(pop, fitnesses):
            ind.fitness.values = (np.dot(w, np.asarray(f)),)

        # Generations
        g = 0
        result = []
        pop = [list(couple) for couple in zip(pop, fitnesses)]
        pop.sort(key=lambda x: np.dot(w, np.asarray(x[1])))

        while g < params['ngen']:
            g = g + 1

            # Select the next generation
            offspring = [x[0] for x in pop[:params['nsel']]]
            pop = pop[:params['nsel']]
            invalid_ind = []

            # Crossover and mutation on the offspring
            for parent1, parent2 in zip(offspring[::2], offspring[1::2]):
                if random.random() < params['tresh']:
                    child1 = toolbox.clone(parent1)
                    child2 = toolbox.clone(parent2)
                    toolbox.mate(child1, child2)
                    del child1.fitness.values
                    invalid_ind.append(child1)
                    del child2.fitness.values
                    invalid_ind.append(child2)

            for ind in offspring:
                if random.random() < params['tresh']:
                    mutant = toolbox.clone(ind)
                    toolbox.mutate(mutant)
                    del mutant.fitness.values
                    invalid_ind.append(mutant)

            # Evaluate the individuals with an invalid fitness
            if (not parallel) or (len(invalid_ind) < mp.cpu_count()):
                fitnesses = [toolbox.evaluate(ind, perturbed_nodes,
                                              initial_condition)
                             for ind in invalid_ind]
            else:
                res_par = self.fitness_evaluation_parallel(invalid_ind,
                    perturbed_nodes, initial_condition)
                res_par.sort(key=lambda x: x[0])
                fitnesses = [x[2] for x in res_par]

            for ind, f in zip(invalid_ind, list(fitnesses)):
                ind.fitness.values = (np.dot(w, np.asarray(f)),)

            ind_fit_invalid = [list(couple)
                               for couple in zip(invalid_ind, fitnesses)]
            pop[:] = pop[:] + ind_fit_invalid[:]

            # Sort the population according to fitness
            pop.sort(key=lambda x: np.dot(w, np.asarray(x[1])))

            # Extract the best state of this generation
            result.append(pop[0])

        logging.getLogger().setLevel(logging.DEBUG)

        return result
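    # Minimal standalone sketch of the DEAP machinery registered above,
    # reduced to a hypothetical 3-switch toolbox:
    #
    #     from deap import base, creator, tools
    #     import random
    #
    #     creator.create("FitnessMin", base.Fitness, weights=(-1.0,))
    #     creator.create("Individual", list, fitness=creator.FitnessMin)
    #     toolbox = base.Toolbox()
    #     toolbox.register("attribute_bool", random.choice, [True, False])
    #     toolbox.register("individual", tools.initRepeat,
    #                      creator.Individual, toolbox.attribute_bool, 3)
    #     ind1, ind2 = toolbox.individual(), toolbox.individual()
    #     tools.cxUniform(ind1, ind2, indpb=0.6)  # in-place uniform crossover
    #     tools.mutFlipBit(ind1, indpb=0.6)       # in-place bit flipping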
    def check_paths_and_measures(self, prefix=None):
        """
        Describe the topology of the graph. Compute efficiency measures for
        the whole graph and its nodes. Check the availability of paths
        between source and target nodes.

        :param prefix: prefix to be added to the column names,
            default to None.
        :type prefix: str, optional
        """
        # Guard: a None prefix cannot be concatenated with the column names
        # below, so fall back to an empty string.
        if prefix is None:
            prefix = ''

        source_user_paths = []

        measure_fields = ['nodal_efficiency', 'local_efficiency', 'service']
        self.update_output(measure_fields, prefix=prefix)

        centrality_fields = ['closeness_centrality',
                             'betweenness_centrality',
                             'indegree_centrality', 'outdegree_centrality',
                             'degree_centrality']
        self.update_output(centrality_fields, prefix=prefix)

        for source in self.G.sources:
            for user in self.G.users:
                if nx.has_path(self.G, source, user):
                    all_paths = list(nx.all_simple_paths(self.G, source,
                                                         user))
                    shpath = self.G.shortest_path[source][user]
                    shpath_length = self.G.shortest_path_length[source][user]
                    neff = 1 / shpath_length
                    ids = source + user
                else:
                    all_paths = 'NO_PATH'
                    shpath = 'NO_PATH'
                    shpath_length = 'NO_PATH'
                    neff = 'NO_PATH'
                    ids = source + user

                source_user_paths.append({
                    'from': source,
                    'to': user,
                    str(prefix + 'shortest_path_length'): shpath_length,
                    str(prefix + 'shortest_path'): shpath,
                    str(prefix + 'simple_path'): all_paths,
                    str(prefix + 'pair_efficiency'): neff,
                    'ids': ids})

        if source_user_paths:
            df = pd.DataFrame(source_user_paths)
            if self.paths_df is None:
                self.paths_df = df
            else:
                self.paths_df = pd.merge(self.paths_df, df,
                                         on=['from', 'to', 'ids'],
                                         how='outer')
    def rm_nodes(self, node, graph, visited=None, broken_nodes=None):
        """
        Remove nodes from the graph in a depth-first-search way to propagate
        the perturbation.

        :param str node: the id of the node to remove.
        :param nx.DiGraph graph: graph on which to apply the node deletion.
        :param visited: nodes already visited, default to None.
        :type visited: set, optional
        :param broken_nodes: nodes that got broken along the perturbation,
            default to None.
        :type broken_nodes: list, optional
        """
        if visited is None:
            visited = set()
            broken_nodes = []

        visited.add(node)
        logging.debug('Visited: %s', visited)
        logging.debug('Node: %s', node)

        broken_nodes.append(node)
        logging.debug('Nodes broken so far: %s', broken_nodes)

        for next_node in set(graph[node]) - visited:
            self.rm_nodes(next_node, graph, visited, broken_nodes)

        return visited, broken_nodes
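    # Illustration on a toy graph (fd is a hypothetical FaultDiagnosis
    # instance): since graph[node] yields the successors of node, the
    # recursion only walks downstream of the damaged element:
    #
    #     G = nx.DiGraph([('A', 'B'), ('B', 'C'), ('C', 'D')])
    #     visited, broken = fd.rm_nodes('B', G)
    #     # broken == ['B', 'C', 'D']; 'A' is not reached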
    def update_output(self, attribute_list, prefix=str()):
        """
        Update the columns of the output DataFrame with the attributes in
        attribute_list.

        :param list attribute_list: list of attributes to be added to the
            output DataFrame.
        :param prefix: prefix to be added to the column names,
            default to an empty string.
        :type prefix: str, optional
        """
        for col in attribute_list:
            self.df[prefix + col] = pd.Series(getattr(self.G, col))
    def delete_a_node(self, node):
        """
        Delete a node in the graph.

        :param str node: the id of the node to remove.

        .. warning:: the node id must be contained in the graph.
            No check is done within this function.
        """
        _, broken_nodes = self.rm_nodes(node, self.G)
        broken_nodes = list(set(broken_nodes))

        self.G._del_nodes.extend(broken_nodes)
        self.G._del_edges.extend(list(self.G.in_edges(nbunch=broken_nodes,
                                                      data=True)))
        self.G._del_edges.extend(list(self.G.out_edges(nbunch=broken_nodes,
                                                       data=True)))

        for n in broken_nodes:
            self.G.remove_node(n)
    def apply_perturbation(self, perturbed_nodes, params, weights, parallel,
                           verbose, kind='element'):
        """
        Perturbation simulator, actually applying the perturbation to all
        the nodes. The optimizer is run if any switch is present, and edges
        connecting a switch's predecessors are removed if the switch state
        is set to 'False'.

        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param dict params: values for the optimizer evolutionary algorithm.
            Dict of: {str: int, str: int, str: float, str: float, str: int}:

            - 'npop': number of individuals for each population
              (default to 300)
            - 'ngen': total number of generations (default to 100)
            - 'indpb': independent probability for attributes to be changed
              (default to 0.6)
            - 'tresh': threshold for applying crossover/mutation
              (default to 0.5)
            - 'nsel': number of individuals to select (default to 5)

        :param dict weights: weights for fitness evaluation on individuals.
            Dict of: {str: float, str: float, str: float, str: float,
            str: float}:

            - 'w1': weight multiplying the number of switch flips
              (default to 1.0)
            - 'w2': weight multiplying the total final service
              (default to -1.0)
            - 'w3': weight multiplying the final graph size
              (default to -1.0)
            - 'w4': weight multiplying the number of users with non-zero
              service (default to -1.0)
            - 'w5': weight for service balance over users (default to 2.0)

        :param bool parallel: flag for parallel fitness evaluation of the
            initial population.
        :param bool verbose: flag for verbose printing.
        :param str kind: type of simulation, used to label output files,
            default to 'element'.

        .. note:: A perturbation, depending on the considered system, may
            spread in all directions starting from the damaged component(s)
            and may affect nearby elements.
        """
        if self.G.switches:

            res = self.optimizer(perturbed_nodes, self.G.init_status,
                                 params, weights, parallel)
            w = np.asarray(list(weights.values()))

            if verbose:
                with open('results_generations.dat', 'w',
                          encoding='utf8') as f:
                    for r in res:
                        f.write(f'{self.G.init_status.items()}')
                        f.write(f'{r[0]} {r[1]}')
                        fit = np.dot(w, np.asarray(r[1]))
                        f.write(f'{fit}\n')

            res.sort(key=lambda x: np.dot(w, np.asarray(x[1])))
            best = dict(zip(self.G.init_status.keys(), res[0][0]))

            initial_condition_sw = list(self.G.init_status.values())
            final_condition_sw = list(best.values())
            flips = dict(zip(self.G.init_status.keys(),
                             np.not_equal(initial_condition_sw,
                                          final_condition_sw)))

            init_open_edges = {}
            for sw, status_sw in self.G.init_status.items():
                if not status_sw:
                    logging.debug('False switch %s in initial configuration',
                                  sw)
                    init_open_edges[sw] = {}
                    for pred in list(self.G.predecessors(sw)):
                        # if the final configuration closes this switch,
                        # memorize the edge attributes to restore them later
                        if flips[sw]:
                            init_open_edges[sw][pred] = self.G[pred][sw]
                        self.G.remove_edge(pred, sw)

        self.check_paths_and_measures(prefix='original_')

        self.G.clear_data(['shortest_path', 'shortest_path_length',
                           'efficiency', 'nodal_efficiency',
                           'local_efficiency', 'computed_service',
                           'closeness_centrality', 'betweenness_centrality',
                           'indegree_centrality', 'outdegree_centrality',
                           'degree_centrality'])

        if self.G.switches:
            for sw, status_sw in best.items():
                if flips[sw]:
                    if not status_sw:
                        logging.debug('Switch %s finally False, first True',
                                      sw)
                        for pre in list(self.G.predecessors(sw)):
                            self.G.remove_edge(pre, sw)
                    else:
                        logging.debug('Switch %s finally True, first False',
                                      sw)
                        for pre, attrs in init_open_edges[sw].items():
                            self.G.add_edge(pre, sw, **attrs)

            print(f'\nBEST: {best}')
            print(f'Number of switch flips: {res[0][1][0]}')
            print(f'Total final service: {res[0][1][1]}')
            print(f'Number of survived nodes: {res[0][1][2]}')
            print(f'Number of users with non-zero service: {res[0][1][3]}')
            print(f'Distance from average: {res[0][1][4]}')
            fit = np.dot(w, np.asarray(res[0][1]))
            print(f'\nFor a final loss of: {fit}\n')

            self.G.final_status = best

        print(f'Perturbed nodes: {perturbed_nodes}')
        for node in perturbed_nodes:
            if node in self.G.nodes():
                self.delete_a_node(node)

        self.check_paths_and_measures(prefix='final_')
        self.paths_df.to_csv('service_paths_' + str(kind) +
                             '_perturbation.csv', index=False)

        status_fields = ['final_status', 'mark_status']
        self.update_output(status_fields)
        self.graph_characterization_to_file(str(kind) + '_perturbation.csv')
    def simulate_element_perturbation(self, perturbed_nodes,
                                      params={'npop': 300, 'ngen': 100,
                                              'indpb': 0.6, 'tresh': 0.5,
                                              'nsel': 5},
                                      weights={'w1': 1.0, 'w2': -1.0,
                                               'w3': -1.0, 'w4': -1.0,
                                               'w5': 2.0},
                                      parallel=False, verbose=True):
        """
        Simulate a perturbation of one or multiple nodes.

        :param list perturbed_nodes: node(s) involved in the perturbing
            event.
        :param params: values for the optimizer evolutionary algorithm.
            Dict of: {str: int, str: int, str: float, str: float, str: int}:

            - 'npop': number of individuals for each population
              (default to 300)
            - 'ngen': total number of generations (default to 100)
            - 'indpb': independent probability for attributes to be changed
              (default to 0.6)
            - 'tresh': threshold for applying crossover/mutation
              (default to 0.5)
            - 'nsel': number of individuals to select (default to 5)

        :type params: dict, optional
        :param weights: weights for fitness evaluation on individuals.
            Dict of: {str: float, str: float, str: float, str: float,
            str: float}:

            - 'w1': weight multiplying the number of switch flips
              (default to 1.0)
            - 'w2': weight multiplying the total final service
              (default to -1.0)
            - 'w3': weight multiplying the final graph size
              (default to -1.0)
            - 'w4': weight multiplying the number of users with non-zero
              service (default to -1.0)
            - 'w5': weight for service balance over users (default to 2.0)

        :type weights: dict, optional
        :param parallel: flag for parallel fitness evaluation of the initial
            population, default to False.
        :type parallel: bool, optional
        :param verbose: flag for verbose output, default to True.
        :type verbose: bool, optional

        .. note:: A perturbation, depending on the considered system, may
            spread in all directions starting from the damaged component(s)
            and may affect nearby elements.

        :raises: SystemExit
        """
        for node in perturbed_nodes:
            if node not in self.G.nodes():
                logging.debug('The node %s is not in the graph', node)
                logging.debug('Insert a valid node')
                logging.debug('Valid nodes: %s', self.G.nodes())
                sys.exit()

        self.apply_perturbation(perturbed_nodes, params, weights, parallel,
                                verbose, kind='element')
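    # End-to-end usage sketch (file name and node id are placeholders):
    #
    #     F = FaultDiagnosis('graph.csv')
    #     F.simulate_element_perturbation(['1'])
    #     # writes service_paths_element_perturbation.csv and
    #     # element_perturbation.csv in the working directory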
    def graph_characterization_to_file(self, filename):
        """
        Write the graph characterization to file, after the perturbation.
        The file is written in CSV format.

        :param str filename: output file name where to write the graph
            characterization.
        """
        self.df.reset_index(inplace=True)
        self.df.rename(columns={'index': 'mark'}, inplace=True)

        fields = ['mark', 'description', 'init_status', 'final_status',
                  'mark_status',
                  'original_closeness_centrality',
                  'final_closeness_centrality',
                  'original_betweenness_centrality',
                  'final_betweenness_centrality',
                  'original_indegree_centrality',
                  'final_indegree_centrality',
                  'original_outdegree_centrality',
                  'final_outdegree_centrality',
                  'original_local_efficiency', 'final_local_efficiency',
                  'original_nodal_efficiency', 'final_nodal_efficiency',
                  'original_service', 'final_service']

        self.df[['init_status', 'final_status']] = \
            self.df[['init_status', 'final_status']].astype(str)
        conversions = {'nan': '', '1.0': '1', '0.0': '0'}
        self.df[['init_status', 'final_status']] = \
            self.df[['init_status', 'final_status']].replace(
                to_replace=conversions)
        self.df[fields].to_csv(filename, index=False)