Skip to content

Commit

Permalink
Merge branch 'ft-1137-etconformance-dfg-new' into 'integration'
Browse files Browse the repository at this point in the history
FT 1137 ETConformance on DFG

See merge request pm4py/pm4py-core!500
  • Loading branch information
fit-sebastiaan-van-zelst committed Oct 15, 2021
2 parents 829f091 + 490b6b1 commit 841e3e5
Show file tree
Hide file tree
Showing 3 changed files with 93 additions and 2 deletions.
3 changes: 1 addition & 2 deletions pm4py/algo/evaluation/precision/__init__.py
Original file line number Diff line number Diff line change
@@ -1,2 +1 @@
from pm4py.algo.evaluation.precision import algorithm, variants, utils

from pm4py.algo.evaluation.precision import algorithm, variants, utils, dfg
1 change: 1 addition & 0 deletions pm4py/algo/evaluation/precision/dfg/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
from pm4py.algo.evaluation.precision.dfg import algorithm
91 changes: 91 additions & 0 deletions pm4py/algo/evaluation/precision/dfg/algorithm.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,91 @@
from collections import Counter
from enum import Enum
from typing import Optional, Dict, Any, Union, Tuple

from pm4py.objects.conversion.log import converter as log_converter
from pm4py.objects.log.obj import EventLog, EventStream
from pm4py.util import exec_utils, xes_constants, constants


class Parameters(Enum):
    """
    Keys that may be used in the ``parameters`` dictionary passed to ``apply``
    """
    # Name of the event attribute holding the activity label; ``apply`` falls back to
    # xes_constants.DEFAULT_NAME_KEY when this key is not provided.
    ACTIVITY_KEY = constants.PARAMETER_CONSTANT_ACTIVITY_KEY


def __is_allowed_prefix(exiting_activities, sa, prefix):
    """
    Tells whether a prefix of activities can be followed on the directly-follows graph
    and still has at least one outgoing edge at its end

    Parameters
    ---------------
    exiting_activities
        Dictionary associating each activity to the set of activities that directly follow it
    sa
        Start activities (only membership is checked)
    prefix
        Sequence of activities to check

    Returns
    ----------------
    boolean
        True for the empty prefix; otherwise True only if the first activity is a start activity,
        every consecutive couple of activities is an edge of the graph, and the last activity
        has an entry in exiting_activities
    """
    if prefix:
        if prefix[0] not in sa:
            return False
        # every consecutive couple (source, target) must be an edge of the graph
        for source, target in zip(prefix, prefix[1:]):
            if target not in exiting_activities.get(source, ()):
                return False
        # a prefix ending in an activity without successors is rejected
        return prefix[-1] in exiting_activities
    # the empty prefix is always allowed
    return True


def apply(log: Union[EventLog, EventStream], dfg: Dict[Tuple[str, str], int],
          start_activities: Dict[str, int], end_activities: Dict[str, int],
          parameters: Optional[Dict[Union[str, Parameters], Any]] = None) -> float:
    """
    Measures the precision of a directly-follows graph against an event log,
    following the ETConformance (escaping edges) approach

    Every distinct prefix of activities observed in the log is collected together with the
    activities that follow it in the log and the number of times it is observed. For each
    prefix accepted by the graph, the activities the graph allows next are compared with the
    ones seen in the log; the allowed-but-unseen ones are the escaping edges. Both quantities
    are weighted by the number of occurrences of the prefix.

    Parameters
    ---------------
    log
        Event log (passed through the log converter before being read)
    dfg
        Directly-follows graph; only its keys (couples of activities) are read
    start_activities
        Start activities of the graph
    end_activities
        End activities of the graph (part of the signature, not read by this computation)
    parameters
        Parameters of the algorithm:
        - Parameters.ACTIVITY_KEY: the event attribute holding the activity
          (defaults to xes_constants.DEFAULT_NAME_KEY)

    Returns
    ----------------
    precision
        1 - (weighted escaping edges / weighted activated transitions), or 1.0 when
        no activated transition is counted
    """
    if parameters is None:
        parameters = {}
    activity_key = exec_utils.get_param_value(Parameters.ACTIVITY_KEY, parameters, xes_constants.DEFAULT_NAME_KEY)

    log = log_converter.apply(log, parameters=parameters)

    # activity -> set of activities directly following it in the graph
    exiting_activities = {}
    for source, target in dfg:
        exiting_activities.setdefault(source, set()).add(target)

    # prefix (tuple of activities) -> activities following it in the log,
    # and prefix -> number of times it is observed
    prefixes = {}
    prefixes_count = Counter()
    for trace in log:
        seen = ()
        for event in trace:
            activity = event[activity_key]
            prefixes.setdefault(seen, set()).add(activity)
            prefixes_count[seen] += 1
            seen += (activity,)

    sum_ee = 0
    sum_at = 0
    for prefix, log_transitions in prefixes.items():
        if not __is_allowed_prefix(exiting_activities, start_activities, prefix):
            continue
        if prefix:
            activated_transitions = exiting_activities[prefix[-1]]
        else:
            # before any event, the graph allows exactly its start activities
            activated_transitions = set(start_activities.keys())
        occurrences = prefixes_count[prefix]
        sum_ee += len(activated_transitions.difference(log_transitions)) * occurrences
        sum_at += len(activated_transitions) * occurrences

    if sum_at > 0:
        return 1 - float(sum_ee) / float(sum_at)
    return 1.0

0 comments on commit 841e3e5

Please sign in to comment.