Source code for pm4py.statistics.start_activities.log.get

from pm4py.util.xes_constants import DEFAULT_NAME_KEY
from pm4py.util import exec_utils
from pm4py.util import constants
from enum import Enum
from typing import Optional, Dict, Any, Union
from pm4py.objects.log.obj import EventLog
from pm4py.objects.conversion.log import converter as log_converter


class Parameters(Enum):
    """
    Keys that callers may use in the ``parameters`` dictionary.

    Most members take their value from the shared ``constants`` module;
    the last two are literal strings defined here. Within this file only
    ``ACTIVITY_KEY`` is read (by ``get_start_activities``).
    """

    # Values taken from pm4py.util.constants
    ATTRIBUTE_KEY = constants.PARAMETER_CONSTANT_ATTRIBUTE_KEY
    ACTIVITY_KEY = constants.PARAMETER_CONSTANT_ACTIVITY_KEY
    START_TIMESTAMP_KEY = constants.PARAMETER_CONSTANT_START_TIMESTAMP_KEY
    TIMESTAMP_KEY = constants.PARAMETER_CONSTANT_TIMESTAMP_KEY
    CASE_ID_KEY = constants.PARAMETER_CONSTANT_CASEID_KEY

    # Literal option names
    MAX_NO_POINTS_SAMPLE = "max_no_of_points_to_sample"
    KEEP_ONCE_PER_CASE = "keep_once_per_case"
def get_start_activities(
    log: EventLog,
    parameters: Optional[Dict[Union[str, Parameters], Any]] = None,
) -> Dict[str, int]:
    """
    Count how often each activity appears as the first event of a trace

    Parameters
    ----------
    log
        Log (converted to an event log through ``log_converter`` before
        being scanned)
    parameters
        Parameters of the algorithm, including:
            Parameters.ACTIVITY_KEY -> Attribute key read from the first
            event of each trace (defaults to concept:name)

    Returns
    ----------
    start_activities
        Dictionary mapping each start activity to the number of traces
        that begin with it. Empty traces, and traces whose first event
        does not carry the activity key, are not counted.
    """
    if parameters is None:
        parameters = {}

    activity_key = exec_utils.get_param_value(
        Parameters.ACTIVITY_KEY, parameters, DEFAULT_NAME_KEY
    )

    event_log = log_converter.apply(
        log,
        variant=log_converter.Variants.TO_EVENT_LOG,
        parameters=parameters,
    )

    counts = {}
    for trace in event_log:
        # Nothing to inspect in an empty trace.
        if len(trace) == 0:
            continue

        first_event = trace[0]
        # Skip traces whose first event has no value under the activity key.
        if activity_key not in first_event:
            continue

        activity = first_event[activity_key]
        counts[activity] = counts.get(activity, 0) + 1

    return counts