{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Process mining and causal discovery example" ] }, { "cell_type": "code", "execution_count": 24, "metadata": {}, "outputs": [], "source": [ "# Use the %pip magic (not `! pip`) so the package is installed into the running kernel's environment\n", "%pip install sax4bpm" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [], "source": [ "# Suppress RuntimeWarning and UserWarning messages so they do not clutter the outputs of later cells\n", "import warnings\n", "warnings.filterwarnings('ignore', category=RuntimeWarning)\n", "warnings.filterwarnings('ignore', category=UserWarning)" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [], "source": [ "import sax\n", "from sax.core.process_data.formatters.xes_formatter import XESFormatter\n", "from sax.core.process_data.formatters.csv_formatter import CSVFormatter\n", "from sax.core.utils.constants import Constants\n", "from lingam.utils import make_dot\n", "from sax.core.process_data.tabular_data import TabularEventData\n", "from pm4py.objects.conversion.log import converter as log_converter\n", "import sax.core.process_mining.process_mining as pm" ] }, { "cell_type": "code", "execution_count": 27, "metadata": {}, "outputs": [], "source": [ "# Import the event log CSV file and create the event_log data object.\n", "# The timestamp_format string below includes fractional seconds (%f).\n", "fileName = \"simulated_run_non_overlapping_gen.csv\"\n", "event_log = pm.import_csv(eventlog=fileName, kloop_unroling=False, timestamp_format=\"%Y-%m-%d %H:%M:%S.%f\")\n" ] }, { "cell_type": "code", "execution_count": 28, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Id | \n", "Source | \n", "Type | \n", "Timestamp | \n", "Resource | \n", "Role | \n", "start:timestamp | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "2182 | \n", "EVENT 1 START | \n", "assign | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner2 | \n", "Administrator | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
1 | \n", "2182 | \n", "EVENT 1 START | \n", "start | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner2 | \n", "Lawyer | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
2 | \n", "2182 | \n", "EVENT 1 START | \n", "complete | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner1 | \n", "Administrator | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
3 | \n", "2182 | \n", "assign | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner3 | \n", "Lawyer | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "|
4 | \n", "2182 | \n", "Archive | \n", "assign | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner1 | \n", "Technician | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
149980 | \n", "686 | \n", "Close Application | \n", "start | \n", "2023-02-03 10:57:38.527000+00:00 | \n", "Owner3 | \n", "Administrator | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149981 | \n", "686 | \n", "Close Application | \n", "complete | \n", "2023-02-03 10:57:44.397227+00:00 | \n", "Owner3 | \n", "Administrator | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149982 | \n", "686 | \n", "EVENT 7 END | \n", "assign | \n", "2023-02-03 10:57:44.397227+00:00 | \n", "Owner3 | \n", "Lawyer | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149983 | \n", "686 | \n", "EVENT 7 END | \n", "start | \n", "2023-02-03 10:57:44.397227+00:00 | \n", "Owner3 | \n", "Lawyer | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149984 | \n", "686 | \n", "EVENT 7 END | \n", "complete | \n", "2023-02-03 10:57:44.397227+00:00 | \n", "Owner1 | \n", "Lawyer | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149985 rows × 7 columns
\n", "\n", " | Id | \n", "Source | \n", "Type | \n", "Timestamp | \n", "Resource | \n", "Role | \n", "start:timestamp | \n", "
---|---|---|---|---|---|---|---|
1 | \n", "2182 | \n", "EVENT 1 START | \n", "start | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner2 | \n", "Lawyer | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
5 | \n", "2182 | \n", "start | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner2 | \n", "Technician | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "|
6 | \n", "2182 | \n", "Archive | \n", "start | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "Owner2 | \n", "Administrator | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
10 | \n", "2182 | \n", "Close Application | \n", "start | \n", "2023-02-24 12:02:36.506000+00:00 | \n", "Owner3 | \n", "Technician | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
13 | \n", "2182 | \n", "EVENT 7 END | \n", "start | \n", "2023-02-24 12:02:43.253164+00:00 | \n", "Owner3 | \n", "Technician | \n", "2023-02-24 12:02:25.523000+00:00 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
149971 | \n", "686 | \n", "EVENT 1 START | \n", "start | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "Owner1 | \n", "Lawyer | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149975 | \n", "686 | \n", "start | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "Owner3 | \n", "Technician | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "|
149976 | \n", "686 | \n", "Archive | \n", "start | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "Owner3 | \n", "Technician | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149980 | \n", "686 | \n", "Close Application | \n", "start | \n", "2023-02-03 10:57:38.527000+00:00 | \n", "Owner3 | \n", "Administrator | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
149983 | \n", "686 | \n", "EVENT 7 END | \n", "start | \n", "2023-02-03 10:57:44.397227+00:00 | \n", "Owner3 | \n", "Lawyer | \n", "2023-02-03 10:57:28.275000+00:00 | \n", "
49995 rows × 7 columns
\n", "\n", " | Id | \n", "start:timestamp | \n", "Archive | \n", "Close Application | \n", "EVENT 1 START | \n", "EVENT 7 END | \n", "|
---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "2023-01-25 09:00:00+00:00 | \n", "2023-01-25 09:00:10.743000+00:00 | \n", "2023-01-25 09:00:17.152773+00:00 | \n", "2023-01-25 09:00:00+00:00 | \n", "2023-01-25 09:00:17.152773+00:00 | \n", "2023-01-25 09:00:06.406000+00:00 | \n", "
1 | \n", "1 | \n", "2023-01-25 09:01:12.348000+00:00 | \n", "2023-01-25 09:01:21.402000+00:00 | \n", "2023-01-25 09:01:28.016404+00:00 | \n", "2023-01-25 09:01:12.348000+00:00 | \n", "2023-01-25 09:01:28.016404+00:00 | \n", "2023-01-25 09:01:18.959000+00:00 | \n", "
2 | \n", "10 | \n", "2023-01-25 09:41:04.989000+00:00 | \n", "2023-01-25 09:41:14.083000+00:00 | \n", "2023-01-25 09:41:20.676132+00:00 | \n", "2023-01-25 09:41:04.989000+00:00 | \n", "2023-01-25 09:41:20.676132+00:00 | \n", "2023-01-25 09:41:11.580000+00:00 | \n", "
3 | \n", "100 | \n", "2023-01-25 16:48:32.712000+00:00 | \n", "2023-01-25 16:48:42.294000+00:00 | \n", "2023-01-25 16:48:47.714735+00:00 | \n", "2023-01-25 16:48:32.712000+00:00 | \n", "2023-01-25 16:48:47.714735+00:00 | \n", "2023-01-25 16:48:38.129000+00:00 | \n", "
4 | \n", "1000 | \n", "2023-02-08 12:01:59.993000+00:00 | \n", "2023-02-08 12:02:10.483000+00:00 | \n", "2023-02-08 12:02:16.848774+00:00 | \n", "2023-02-08 12:01:59.993000+00:00 | \n", "2023-02-08 12:02:16.848774+00:00 | \n", "2023-02-08 12:02:06.355000+00:00 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
9994 | \n", "9994 | \n", "2023-06-19 12:25:33.362000+00:00 | \n", "2023-06-19 12:25:43.787000+00:00 | \n", "2023-06-19 12:25:50.615538+00:00 | \n", "2023-06-19 12:25:33.362000+00:00 | \n", "2023-06-19 12:25:50.615538+00:00 | \n", "2023-06-19 12:25:40.188000+00:00 | \n", "
9995 | \n", "9995 | \n", "2023-06-19 12:25:55.764000+00:00 | \n", "2023-06-19 12:26:05.662000+00:00 | \n", "2023-06-19 12:26:11.965755+00:00 | \n", "2023-06-19 12:25:55.764000+00:00 | \n", "2023-06-19 12:26:11.965755+00:00 | \n", "2023-06-19 12:26:02.064000+00:00 | \n", "
9996 | \n", "9996 | \n", "2023-06-19 12:27:15.155000+00:00 | \n", "2023-06-19 12:27:25.548000+00:00 | \n", "2023-06-19 12:27:31.124483+00:00 | \n", "2023-06-19 12:27:15.155000+00:00 | \n", "2023-06-19 12:27:31.124483+00:00 | \n", "2023-06-19 12:27:20.729000+00:00 | \n", "
9997 | \n", "9997 | \n", "2023-06-19 12:30:28.224000+00:00 | \n", "2023-06-19 12:30:38.557000+00:00 | \n", "2023-06-19 12:30:44.296887+00:00 | \n", "2023-06-19 12:30:28.224000+00:00 | \n", "2023-06-19 12:30:44.296887+00:00 | \n", "2023-06-19 12:30:33.960000+00:00 | \n", "
9998 | \n", "9998 | \n", "2023-06-19 12:31:29.774000+00:00 | \n", "2023-06-19 12:31:40.249000+00:00 | \n", "2023-06-19 12:31:46.576142+00:00 | \n", "2023-06-19 12:31:29.774000+00:00 | \n", "2023-06-19 12:31:46.576142+00:00 | \n", "2023-06-19 12:31:36.099000+00:00 | \n", "
9999 rows × 7 columns
\n", "