Source code for pm4py.algo.organizational_mining.sna.util

'''
    PM4Py – A Process Mining Library for Python
Copyright (C) 2024 Process Intelligence Solutions UG (haftungsbeschränkt)

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as
published by the Free Software Foundation, either version 3 of the
License, or any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU Affero General Public License for more details.

You should have received a copy of the GNU Affero General Public License
along with this program.  If not, see this software project's root or
visit <https://www.gnu.org/licenses/>.

Website: https://processintelligence.solutions
Contact: info@processintelligence.solutions
'''
from typing import List, Dict
from enum import Enum
from pm4py.util import exec_utils, nx_utils
from pm4py.objects.org.sna.obj import SNA
import numpy as np


[docs] class Parameters(Enum): WEIGHT_THRESHOLD = "weight_threshold"
[docs] def sna_result_to_nx_graph(sna: SNA, parameters=None): """ Transforms the results of SNA to a NetworkX Graph / DiGraph object (depending on the type of analysis). Parameters ------------------ sna Result of a SNA operation parameters Parameters of the algorithm, including: - Parameters.WEIGHT_THRESHOLD => the weight threshold (used to filter out edges) Returns ----------------- nx_graph NetworkX Graph / DiGraph """ if parameters is None: parameters = {} weight_threshold = exec_utils.get_param_value( Parameters.WEIGHT_THRESHOLD, parameters, 0.0 ) directed = sna.is_directed if directed: graph = nx_utils.DiGraph() else: graph = nx_utils.Graph() graph.add_edges_from( {c for c, w in sna.connections.items() if w >= weight_threshold} ) return graph
[docs] def cluster_affinity_propagation( sna: SNA, parameters=None ) -> Dict[str, List[str]]: """ Performs a clustering using the affinity propagation algorithm provided by Scikit Learn Parameters -------------- sna Result of a SNA operation parameters Parameters of the algorithm Returns -------------- clustering Dictionary that contains, for each cluster that has been identified, the list of resources of the cluster """ from pm4py.util import ml_utils if parameters is None: parameters = {} originators = list( set(x[0] for x, y in sna.connections.items()).union( set(x[1] for x, y in sna.connections.items()) ) ) matrix = np.zeros((len(originators), len(originators))) for c, w in sna.connections.items(): matrix[originators.index(c[0]), originators.index(c[1])] = w affinity_propagation = ml_utils.AffinityPropagation(**parameters) affinity_propagation.fit(matrix) clusters = affinity_propagation.predict(matrix) ret = {} for i in range(len(clusters)): res = originators[i] cluster = str(clusters[i]) if cluster not in ret: ret[cluster] = [] ret[cluster].append(res) return ret