{"nodes":[{"code":"import os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport matplotlib.pyplot as plt\n\n# Device handling (required)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure\nexperiment_data = {\n    \"BPI2012\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"BPI2017\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"ROAD\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n}\n\n# Data loading utilities (use provided helper)\nfrom ai_scientist.ideas.my_research_topic import load_datasets, pick_default_dataset\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    # Keep only 'complete' transitions if lifecycle exists\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()  # fallback if empty\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    # Build activity vocab\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        # Convert to numpy arrays for safe positional indexing\n        ts_ns = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        )  # nanoseconds\n        ts = (ts_ns // 10**9).astype(np.int64)  # seconds as numpy array\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        # simple calendar features\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        # time deltas and since start in seconds\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(\n            np.float32\n        )  # [T,5]\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        # Generate prefixes of length k (min_prefix_len..min(max_prefix_len, T-1)); target = activity at position k\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    # Collect feature normalization stats over all feats (initial; will be recomputed on train split)\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)  # [B,T,emb]\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            # top-3 correctness\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_one_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples across all to get vocab; we'll re-normalize with train stats\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter per split\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training loop\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {epoch}: validation_loss = {val_loss:.4f} | val_acc={val_acc:.4f} | val_f1={val_f1:.4f} | val_top3={val_top3:.4f}\"\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        experiment_data[name][\"losses\"][\"train\"].append((epoch, train_loss))\n        experiment_data[name][\"losses\"][\"val\"].append((epoch, val_loss))\n        experiment_data[name][\"metrics\"][\"val\"].append(\n            (epoch, {\"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3})\n        )\n        experiment_data[name][\"epochs\"].append(epoch)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n\n    # Load best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final eval on train/val/test\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Save metrics\n    experiment_data[name][\"metrics\"][\"train\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n        )\n    )\n    experiment_data[name][\"metrics\"][\"val\"].append(\n        (\n            \"final\",\n            {\"loss\": val_loss, \"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3},\n        )\n    )\n    experiment_data[name][\"metrics\"][\"test\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        )\n    )\n    experiment_data[name][\"predictions\"] = y_pred_t.tolist()\n    experiment_data[name][\"ground_truth\"] = y_true_t.tolist()\n\n    # Plots\n    try:\n        plt.figure()\n        plt.plot(hist[\"train_loss\"], label=\"train_loss\")\n        plt.plot(hist[\"val_loss\"], label=\"val_loss\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"loss_curves_{name}.png\"))\n        plt.close()\n\n        plt.figure()\n        plt.plot(hist[\"val_top3\"], label=\"val_top3\")\n        plt.legend()\n        plt.title(f\"Val Top-3 Acc - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Top-3 Acc\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"val_top3_{name}.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"[warn] Plotting failed: {e}\")\n\n    # Save confusion matrix-like data (optional)\n    try:\n        from sklearn.metrics import confusion_matrix\n\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"cm_{name}.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n\n\ndef main():\n    datasets = load_datasets()\n    # Loop through loaded datasets; cap to 5000 earliest cases for speed\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        train_one_dataset(\n            key, df_small, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    np.savez_compressed(\n        os.path.join(working_dir, \"experiment_data_compressed.npz\"),\n        data=experiment_data,\n    )\n\n\n# Execute immediately\nmain()\n","plan":"The crash arises because timestamps within each case were kept as a pandas Series and indexed with integer labels, which pandas interprets as label-based indexing; for non-RangeIndex groups, accessing ts[k] raises KeyError. I fix this by converting timestamps to a dense numpy array (ts = ... .to_numpy()), ensuring positional indexing. I also make the prefix generation loop explicitly stop at T-1 to guarantee the existence of a next event, preventing off-by-one mistakes. The rest of the pipeline remains intact: time-based split by case start, prefix features, a simple LSTM baseline, and required BPM metrics and saving.","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import (\n    f1_score,\n    accuracy_score,\n    confusion_matrix,\n    precision_recall_curve,\n    average_precision_score,\n)\nfrom sklearn.preprocessing import label_binarize\nimport random\nimport math\nfrom collections import defaultdict\n\n# Reproducibility and device\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# --------- Data loading from local XES via pm4py ----------\ndef load_xes_folder(data_dir=\"data\"):\n    datasets = {}\n    try:\n        import pm4py\n    except Exception as e:\n        print(f\"pm4py not available: {e}\")\n        return datasets\n    if not os.path.isdir(data_dir):\n        print(f\"Data directory not found: {data_dir}\")\n        return datasets\n    for fn in os.listdir(data_dir):\n        if fn.lower().endswith(\".xes\") or fn.lower().endswith(\".xes.gz\"):\n            path = os.path.join(data_dir, fn)\n            try:\n                log = pm4py.read_xes(path)\n                df = pm4py.convert_to_dataframe(log)\n                # Standardize columns\n                # pm4py dataframe typically has case:concept:name, concept:name, time:timestamp, lifecycle:transition\n                cols = df.columns\n                case_col = (\n                    \"case:concept:name\"\n                    if \"case:concept:name\" in cols\n                    else (\"case\" if \"case\" in cols else None)\n                )\n                act_col = (\n                    \"concept:name\"\n                    if \"concept:name\" in cols\n                    else (\"activity\" if \"activity\" in cols else None)\n                )\n                ts_col = (\n                    \"time:timestamp\"\n                    if \"time:timestamp\" in cols\n                    else (\"timestamp\" if \"timestamp\" in cols else None)\n                )\n                life_col = (\n                    \"lifecycle:transition\"\n                    if \"lifecycle:transition\" in cols\n                    else (\"lifecycle\" if \"lifecycle\" in cols else None)\n                )\n                if case_col is None or act_col is None or ts_col is None:\n                    print(f\"Missing required columns in {fn}, skipping.\")\n                    continue\n                out = pd.DataFrame(\n                    {\n                        \"case_id\": df[case_col].astype(str).values,\n                        \"activity\": df[act_col].astype(str).values,\n                        \"timestamp\": pd.to_datetime(df[ts_col], utc=True),\n                    }\n                )\n                if life_col is not None:\n                    out[\"lifecycle\"] = df[life_col].astype(str).values\n                name = os.path.splitext(fn)[0]\n                datasets[name] = out\n                print(\n                    f\"Loaded {name}: {len(out)} events, {out['case_id'].nunique()} cases\"\n                )\n            except Exception as e:\n                print(f\"Failed to load {fn}: {e}\")\n    return datasets\n\n\n# --------- Prefix building and split ----------\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if mask.any():\n            df = df[mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        if len(g) < 2:\n            continue\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        ts = (g_ts.astype(\"int64\") // 10**9).to_numpy(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                    \"prefix_len\": k,\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    for s in samples:\n        pass  # initial no norm; will norm on train split\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.vstack(\n            [\n                np.zeros((pad_len, self.num_cont), dtype=np.float32),\n                feats.astype(np.float32),\n            ]\n        )\n        attn = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad).long(),\n            \"feats\": torch.tensor(feats_pad).float(),\n            \"mask\": torch.tensor(attn).float(),\n            \"y\": torch.tensor(s[\"target\"]).long(),\n            \"prefix_len\": L,\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, pad_idx=0):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim, hidden_size=hidden, batch_first=True\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h = self.dropout(h[-1])\n        return self.fc(h)\n\n\ndef collate_fn(batch):\n    out = {\n        k: (\n            torch.stack([b[k] for b in batch], 0)\n            if isinstance(batch[0][k], torch.Tensor)\n            else [b[k] for b in batch]\n        )\n        for k in batch[0].keys()\n    }\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys = []\n    yhat = []\n    probs_list = []\n    n = 0\n    top3_correct = 0\n    pref_lens = []\n    top3_flags = []\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk = torch.topk(probs, k=k_val, dim=1)\n            y = batch[\"y\"]\n            ys.extend(y.detach().cpu().tolist())\n            yhat.extend(top1.detach().cpu().tolist())\n            probs_list.append(probs.detach().cpu().numpy())\n            for i in range(y.size(0)):\n                flag = int(y[i].item() in topk[i].detach().cpu().tolist())\n                top3_correct += flag\n                top3_flags.append(flag)\n                pref_lens.append(int(batch[\"prefix_len\"][i].item()))\n            n += y.size(0)\n    avg_loss = total_loss / max(1, n)\n    y_true = np.array(ys)\n    y_pred = np.array(yhat)\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n))\n    probs_concat = (\n        np.concatenate(probs_list, axis=0)\n        if len(probs_list) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return (\n        avg_loss,\n        acc,\n        f1,\n        top3,\n        y_true,\n        y_pred,\n        probs_concat,\n        np.array(pref_lens),\n        np.array(top3_flags),\n    )\n\n\ndef train_on_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    s_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    s_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    s_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # normalize time features on train\n    if len(s_train) > 0:\n        feats = np.concatenate(\n            [s[\"seq_feats\"] for s in s_train if len(s[\"seq_feats\"]) > 0], axis=0\n        )\n        dt_mean, dt_std = feats[:, 0].mean(), feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = feats[:, 1].mean(), feats[:, 1].std() + 1e-6\n\n        def norm(samples):\n            for s in samples:\n                if s[\"seq_feats\"].shape[0] > 0:\n                    s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                    s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n        norm(s_train)\n        norm(s_val)\n        norm(s_test)\n    print(\n        f\"Samples train/val/test: {len(s_train)}/{len(s_val)}/{len(s_test)}; vocab={len(act2id)}\"\n    )\n    if len(s_train) == 0 or len(act2id) < 2:\n        print(\"Insufficient data; skipping.\")\n        return None\n    ds_tr = PrefixDataset(s_train, pad_id, max_prefix_len, 5)\n    ds_va = PrefixDataset(s_val, pad_id, max_prefix_len, 5)\n    ds_te = PrefixDataset(s_test, pad_id, max_prefix_len, 5)\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn\n    )\n    dl_va = DataLoader(\n        ds_va, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    dl_te = DataLoader(\n        ds_te, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    model = LSTMBaseline(\n        vocab_size=len(act2id), emb_dim=64, cont_dim=5, hidden=128, pad_idx=pad_id\n    ).to(device)\n    crit = nn.CrossEntropyLoss().to(device)\n    opt = torch.optim.Adam(model.parameters(), lr=lr)\n    best_top3 = -1.0\n    best_state = None\n    history = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for ep in range(1, max_epochs + 1):\n        model.train()\n        tot = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            opt.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = crit(logits, batch[\"y\"])\n            loss.backward()\n            opt.step()\n            run_loss += loss.item() * logits.size(0)\n            tot += logits.size(0)\n        tr_loss = run_loss / max(1, tot)\n        va_loss, va_acc, va_f1, va_top3, *_ = evaluate(\n            model, dl_va, crit, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {ep}: val_loss={va_loss:.4f} acc={va_acc:.4f} f1={va_f1:.4f} top3={va_top3:.4f}\"\n        )\n        history[\"train_loss\"].append(tr_loss)\n        history[\"val_loss\"].append(va_loss)\n        history[\"val_top3\"].append(va_top3)\n        if va_top3 > best_top3:\n            best_top3 = va_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    tr_loss, tr_acc, tr_f1, tr_top3, *_ = evaluate(\n        model, dl_tr, crit, device, len(act2id), pad_id\n    )\n    te_loss, te_acc, te_f1, te_top3, y_true, y_pred, probs, pref_lens, top3_flags = (\n        evaluate(model, dl_te, crit, device, len(act2id), pad_id)\n    )\n    print(\n        f\"[{name}] Test: loss={te_loss:.4f} acc={te_acc:.4f} f1={te_f1:.4f} top3={te_top3:.4f}\"\n    )\n    # package experiment data\n    exp = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": tr_loss,\n                        \"acc\": tr_acc,\n                        \"macro_f1\": tr_f1,\n                        \"top3\": tr_top3,\n                    },\n                )\n            ],\n            \"val\": [],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": te_loss,\n                        \"acc\": te_acc,\n                        \"macro_f1\": te_f1,\n                        \"top3\": te_top3,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(history[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(history[\"val_loss\"], start=1)),\n        },\n        \"predictions\": y_pred.tolist(),\n        \"ground_truth\": y_true.tolist(),\n        \"epochs\": list(range(1, len(history[\"train_loss\"]) + 1)),\n        \"probs\": probs,\n        \"prefix_lens\": pref_lens.tolist(),\n        \"top3_flags\": top3_flags.tolist(),\n        \"act2id\": act2id,\n    }\n    # plots for this dataset\n    try:\n        plt.figure()\n        plt.plot(history[\"train_loss\"], label=\"train\")\n        plt.plot(history[\"val_loss\"], label=\"val\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating loss curves for {name}: {e}\")\n        plt.close()\n    try:\n        cm = confusion_matrix(y_true, y_pred)\n        plt.figure(figsize=(5, 4))\n        plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n        plt.colorbar()\n        plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n        plt.xlabel(\"Predicted\")\n        plt.ylabel(\"True\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_confusion_matrix.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {name}: {e}\")\n        plt.close()\n    try:\n        # Top-3 accuracy vs prefix length\n        if len(pref_lens) > 0:\n            d = defaultdict(list)\n            for L, flag in zip(pref_lens, top3_flags):\n                d[int(L)].append(int(flag))\n            xs = sorted(d.keys())\n            ys = [np.mean(d[k]) for k in xs]\n            plt.figure()\n            plt.plot(xs, ys, marker=\"o\")\n            plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n            plt.xlabel(\"Prefix Length\")\n            plt.ylabel(\"Top-3 Accuracy\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_top3_vs_prefixlen.png\"))\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating Top-3 vs prefix length for {name}: {e}\")\n        plt.close()\n    try:\n        # Macro PR curve (one-vs-rest); may be coarse due to many classes\n        if probs.shape[0] > 0:\n            classes = np.unique(y_true)\n            Y = label_binarize(y_true, classes=range(probs.shape[1]))\n            # only keep columns present in classes to avoid PAD\n            present = [c for c in classes]\n            if len(present) > 1:\n                precisions = []\n                recalls = []\n                aps = []\n                for c in present:\n                    p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                    ap = average_precision_score(Y[:, c], probs[:, c])\n                    precisions.append(\n                        np.interp(np.linspace(0, 1, 101), r[::-1], p[::-1])\n                    )\n                    recalls.append(np.linspace(0, 1, 101))\n                    aps.append(ap)\n                macro_p = np.mean(np.stack(precisions, 0), 0)\n                macro_r = np.linspace(0, 1, 101)\n                plt.figure()\n                plt.plot(macro_r, macro_p, label=f\"Macro-PR (mAP={np.mean(aps):.3f})\")\n                plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Recall\")\n                plt.ylabel(\"Precision\")\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(os.path.join(working_dir, f\"{name}_macro_pr.png\"))\n                plt.close()\n    except Exception as e:\n        print(f\"Error creating PR curve for {name}: {e}\")\n        plt.close()\n    return name, exp\n\n\ndef main():\n    datasets = load_xes_folder(data_dir=os.path.join(os.getcwd(), \"data\"))\n    experiment_data = {}\n    for name, df in datasets.items():\n        # optional cap earliest 5000 cases\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep = set(starts.iloc[:5000][\"case_id\"])\n                df = df[df[\"case_id\"].isin(keep)].copy()\n        except:\n            pass\n        res = train_on_dataset(\n            name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n        if res is not None:\n            k, exp = res\n            experiment_data[k] = exp\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    # Print evaluation metrics\n    for k, v in experiment_data.items():\n        test_metrics = dict(v[\"metrics\"][\"test\"][0][1])\n        print(\n            f\"{k} | Test acc={test_metrics['acc']:.4f} macro_f1={test_metrics['macro_f1']:.4f} top3={test_metrics['top3']:.4f} loss={test_metrics['loss']:.4f}\"\n        )\n\n    # Secondary plotting pass strictly from experiment_data.npy (as required)\n    try:\n        experiment_data_loaded = np.load(\n            os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n        ).item()\n    except Exception as e:\n        print(f\"Error loading experiment data: {e}\")\n        experiment_data_loaded = {}\n    for name, ed in experiment_data_loaded.items():\n        try:\n            # re-plot loss curves from saved data\n            plt.figure()\n            tl = [y for (_, y) in ed.get(\"losses\", {}).get(\"train\", [])]\n            vl = [y for (_, y) in ed.get(\"losses\", {}).get(\"val\", [])]\n            if len(tl) > 0:\n                plt.plot(tl, label=\"train\")\n            if len(vl) > 0:\n                plt.plot(vl, label=\"val\")\n            plt.legend()\n            plt.title(f\"Loss Curves - {name}\\nNext-activity\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves_reload.png\"))\n            plt.close()\n        except Exception as e:\n            print(f\"Error creating plot1: {e}\")\n            plt.close()\n        try:\n            # confusion matrix from predictions and ground truth\n            y_true = ed.get(\"ground_truth\", [])\n            y_pred = ed.get(\"predictions\", [])\n            if len(y_true) > 0 and len(y_pred) > 0:\n                cm = confusion_matrix(y_true, y_pred)\n                plt.figure(figsize=(5, 4))\n                plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n                plt.colorbar()\n                plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Predicted\")\n                plt.ylabel(\"True\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_confusion_matrix_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot2: {e}\")\n            plt.close()\n        try:\n            # Top-3 vs prefix length if present\n            pref = ed.get(\"prefix_lens\", [])\n            flags = ed.get(\"top3_flags\", [])\n            if len(pref) > 0 and len(flags) > 0:\n                d = defaultdict(list)\n                for L, f in zip(pref, flags):\n                    d[int(L)].append(int(f))\n                xs = sorted(d.keys())\n                ys = [float(np.mean(d[x])) for x in xs]\n                plt.figure()\n                plt.plot(xs, ys, marker=\"o\")\n                plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n                plt.xlabel(\"Prefix Length\")\n                plt.ylabel(\"Top-3 Accuracy\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_top3_vs_prefixlen_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot3: {e}\")\n            plt.close()\n        try:\n            # Macro PR curve if probs available\n            probs = np.array(ed.get(\"probs\", []))\n            y_true = ed.get(\"ground_truth\", [])\n            if probs.size > 0 and len(y_true) > 0:\n                classes = sorted(set(y_true))\n                Y = label_binarize(np.array(y_true), classes=range(probs.shape[1]))\n                present = classes\n                if len(present) > 1:\n                    precisions = []\n                    aps = []\n                    grid = np.linspace(0, 1, 101)\n                    for c in present:\n                        p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                        precisions.append(np.interp(grid, r[::-1], p[::-1]))\n                        aps.append(average_precision_score(Y[:, c], probs[:, c]))\n                    macro_p = np.mean(np.stack(precisions, 0), 0)\n                    plt.figure()\n                    plt.plot(grid, macro_p, label=f\"mAP={np.mean(aps):.3f}\")\n                    plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                    plt.xlabel(\"Recall\")\n                    plt.ylabel(\"Precision\")\n                    plt.legend()\n                    plt.tight_layout()\n                    plt.savefig(\n                        os.path.join(working_dir, f\"{name}_macro_pr_reload.png\")\n                    )\n                    plt.close()\n        except Exception as e:\n            print(f\"Error creating plot4: {e}\")\n            plt.close()\n\n\nif __name__ == \"__main__\":\n    main()\n","plot_plan":"We tackle next-activity prediction from local XES logs using pm4py, building time-ordered prefixes and splitting cases by start time into train/val/test. Activities are tokenized and simple temporal/calendar features are added; a small LSTM consumes past activities plus features to predict the next activity. We train for a few epochs, select the best model by validation Top-3 accuracy, then evaluate on test with accuracy, macro-F1, Top-3, and confusion matrix; we also keep per-sample prefix lengths to compute Top-3 vs prefix length. We aggregate results into an experiment_data object and save it. Finally, we generate standard plots only from the saved experiment_data: loss curves, confusion matrix, macro-PR if probabilities exist, and Top-3 vs prefix length. We ensure each plot is guarded with try-except and saved to working_dir, closing figures after saving. The code uses pm4py to load any local .xes files, avoids external datasets, performs time-based splits, and reports BPM metrics.","step":0,"id":"726b2721d45c4800b9381c5d265fefcb","ctime":1757756714.9796784,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Available in /workspace/data: ['BPI_Challenge_2012.xes', 'BPI_Challenge_2017.xes', 'Road_Traffic_Fine_Management_Process.xes']","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<22:13,  9.81it/s]","\rparsing log, completed traces ::   1%|1         | 155/13087 [00:00<00:14, 902.77it/s]","\rparsing log, completed traces ::   2%|2         | 307/13087 [00:00<00:10, 1183.23it/s]","\rparsing log, completed traces ::   4%|3         | 475/13087 [00:00<00:09, 1374.93it/s]","\rparsing log, completed traces ::   5%|4         | 632/13087 [00:00<00:08, 1441.90it/s]","\rparsing log, completed traces ::   6%|5         | 777/13087 [00:00<00:15, 819.10it/s] ","\rparsing log, completed traces ::   7%|7         | 927/13087 [00:00<00:12, 964.33it/s]","\rparsing log, completed traces ::   8%|8         | 1092/13087 [00:01<00:10, 1124.33it/s]","\rparsing log, completed traces ::  10%|9         | 1260/13087 [00:01<00:09, 1261.95it/s]","\rparsing log, completed traces ::  11%|#1        | 1456/13087 [00:01<00:08, 1445.90it/s]","\rparsing log, completed traces ::  12%|#2        | 1635/13087 [00:01<00:07, 1535.07it/s]","\rparsing log, completed traces ::  14%|#3        | 1809/13087 [00:01<00:07, 1587.27it/s]","\rparsing log, completed traces ::  15%|#5        | 1977/13087 [00:01<00:07, 1564.32it/s]","\rparsing log, completed traces ::  16%|#6        | 2142/13087 [00:01<00:06, 1586.66it/s]","\rparsing log, completed traces ::  18%|#7        | 2311/13087 [00:01<00:06, 1614.55it/s]","\rparsing log, completed traces ::  19%|#9        | 2499/13087 [00:01<00:06, 1691.18it/s]","\rparsing log, completed traces ::  20%|##        | 2671/13087 [00:01<00:06, 1682.60it/s]","\rparsing log, completed traces ::  22%|##1       | 2842/13087 [00:02<00:06, 1609.51it/s]","\rparsing log, completed traces ::  23%|##2       | 3005/13087 [00:02<00:10, 939.23it/s] ","\rparsing log, completed traces ::  24%|##4       | 3153/13087 [00:02<00:09, 1042.68it/s]","\rparsing log, completed traces ::  26%|##5       | 3396/13087 [00:02<00:07, 1339.99it/s]","\rparsing log, completed traces ::  27%|##7       | 3575/13087 [00:02<00:06, 1442.75it/s]","\rparsing log, completed traces ::  29%|##8       | 3764/13087 [00:02<00:05, 1554.54it/s]","\rparsing log, completed traces ::  30%|###       | 3945/13087 [00:02<00:05, 1621.59it/s]","\rparsing log, completed traces ::  32%|###1      | 4186/13087 [00:03<00:04, 1836.31it/s]","\rparsing log, completed traces ::  34%|###3      | 4403/13087 [00:03<00:04, 1924.51it/s]","\rparsing log, completed traces ::  35%|###5      | 4608/13087 [00:03<00:04, 1960.03it/s]","\rparsing log, completed traces ::  37%|###6      | 4811/13087 [00:03<00:04, 1910.52it/s]","\rparsing log, completed traces ::  38%|###8      | 5012/13087 [00:03<00:04, 1938.09it/s]","\rparsing log, completed traces ::  40%|###9      | 5210/13087 [00:03<00:04, 1865.51it/s]","\rparsing log, completed traces ::  41%|####1     | 5400/13087 [00:03<00:04, 1822.65it/s]","\rparsing log, completed traces ::  43%|####2     | 5585/13087 [00:03<00:04, 1711.36it/s]","\rparsing log, completed traces ::  44%|####4     | 5764/13087 [00:03<00:04, 1726.93it/s]","\rparsing log, completed traces ::  45%|####5     | 5939/13087 [00:04<00:07, 943.97it/s] ","\rparsing log, completed traces ::  47%|####6     | 6102/13087 [00:04<00:06, 1066.47it/s]","\rparsing log, completed traces ::  48%|####8     | 6284/13087 [00:04<00:05, 1219.00it/s]","\rparsing log, completed traces ::  50%|####9     | 6481/13087 [00:04<00:04, 1381.28it/s]","\rparsing log, completed traces ::  51%|#####     | 6648/13087 [00:04<00:04, 1440.78it/s]","\rparsing log, completed traces ::  52%|#####2    | 6813/13087 [00:04<00:04, 1491.87it/s]","\rparsing log, completed traces ::  53%|#####3    | 6978/13087 [00:04<00:04, 1478.08it/s]","\rparsing log, completed traces ::  55%|#####4    | 7150/13087 [00:05<00:03, 1542.98it/s]","\rparsing log, completed traces ::  56%|#####5    | 7313/13087 [00:05<00:03, 1554.25it/s]","\rparsing log, completed traces ::  57%|#####7    | 7475/13087 [00:05<00:03, 1511.56it/s]","\rparsing log, completed traces ::  58%|#####8    | 7631/13087 [00:05<00:03, 1506.49it/s]","\rparsing log, completed traces ::  60%|#####9    | 7795/13087 [00:05<00:03, 1542.51it/s]","\rparsing log, completed traces ::  61%|######    | 7952/13087 [00:05<00:03, 1522.31it/s]","\rparsing log, completed traces ::  62%|######2   | 8125/13087 [00:05<00:03, 1574.39it/s]","\rparsing log, completed traces ::  63%|######3   | 8305/13087 [00:05<00:02, 1638.91it/s]","\rparsing log, completed traces ::  65%|######4   | 8476/13087 [00:05<00:02, 1659.72it/s]","\rparsing log, completed traces ::  66%|######6   | 8645/13087 [00:05<00:02, 1666.27it/s]","\rparsing log, completed traces ::  67%|######7   | 8813/13087 [00:06<00:02, 1653.27it/s]","\rparsing log, completed traces ::  69%|######8   | 8979/13087 [00:06<00:04, 844.36it/s] ","\rparsing log, completed traces ::  70%|######9   | 9120/13087 [00:06<00:04, 943.26it/s]","\rparsing log, completed traces ::  71%|#######1  | 9308/13087 [00:06<00:03, 1131.69it/s]","\rparsing log, completed traces ::  72%|#######2  | 9471/13087 [00:06<00:02, 1241.38it/s]","\rparsing log, completed traces ::  74%|#######3  | 9624/13087 [00:06<00:02, 1280.12it/s]","\rparsing log, completed traces ::  75%|#######4  | 9787/13087 [00:06<00:02, 1365.32it/s]","\rparsing log, completed traces ::  76%|#######6  | 9950/13087 [00:07<00:02, 1433.72it/s]","\rparsing log, completed traces ::  77%|#######7  | 10112/13087 [00:07<00:02, 1482.43it/s]","\rparsing log, completed traces ::  78%|#######8  | 10270/13087 [00:07<00:01, 1492.40it/s]","\rparsing log, completed traces ::  80%|#######9  | 10426/13087 [00:07<00:01, 1495.09it/s]","\rparsing log, completed traces ::  81%|########  | 10580/13087 [00:07<00:01, 1456.05it/s]","\rparsing log, completed traces ::  82%|########2 | 10761/13087 [00:07<00:01, 1552.73it/s]","\rparsing log, completed traces ::  84%|########3 | 10946/13087 [00:07<00:01, 1636.64it/s]","\rparsing log, completed traces ::  85%|########4 | 11121/13087 [00:07<00:01, 1667.60it/s]","\rparsing log, completed traces ::  86%|########6 | 11295/13087 [00:07<00:01, 1683.98it/s]","\rparsing log, completed traces ::  88%|########7 | 11497/13087 [00:08<00:00, 1780.59it/s]","\rparsing log, completed traces ::  89%|########9 | 11677/13087 [00:08<00:00, 1764.28it/s]","\rparsing log, completed traces ::  91%|######### | 11879/13087 [00:08<00:00, 1839.23it/s]","\rparsing log, completed traces ::  92%|#########2| 12064/13087 [00:08<00:00, 1838.87it/s]","\rparsing log, completed traces ::  94%|#########3| 12278/13087 [00:08<00:00, 1928.19it/s]","\rparsing log, completed traces ::  95%|#########5| 12472/13087 [00:08<00:00, 879.69it/s] ","\rparsing log, completed traces ::  97%|#########6| 12671/13087 [00:09<00:00, 1058.76it/s]","\rparsing log, completed traces ::  98%|#########8| 12863/13087 [00:09<00:00, 1218.85it/s]","\rparsing log, completed traces :: 100%|#########9| 13065/13087 [00:09<00:00, 1387.49it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:09<00:00, 1419.98it/s]","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:44:28,  1.85it/s]","\rparsing log, completed traces ::   0%|          | 68/31509 [00:00<03:43, 140.65it/s]","\rparsing log, completed traces ::   0%|          | 126/31509 [00:00<02:10, 240.46it/s]","\rparsing log, completed traces ::   1%|          | 194/31509 [00:00<01:29, 348.13it/s]","\rparsing log, completed traces ::   1%|          | 254/31509 [00:00<01:15, 412.78it/s]","\rparsing log, completed traces ::   1%|1         | 318/31509 [00:01<01:06, 472.43it/s]","\rparsing log, completed traces ::   1%|1         | 382/31509 [00:01<01:00, 518.19it/s]","\rparsing log, completed traces ::   1%|1         | 443/31509 [00:01<00:57, 538.22it/s]","\rparsing log, completed traces ::   2%|1         | 507/31509 [00:01<00:54, 566.63it/s]","\rparsing log, completed traces ::   2%|1         | 569/31509 [00:01<00:54, 565.64it/s]","\rparsing log, completed traces ::   2%|2         | 635/31509 [00:01<00:52, 591.58it/s]","\rparsing log, completed traces ::   2%|2         | 707/31509 [00:01<00:49, 626.99it/s]","\rparsing log, completed traces ::   2%|2         | 772/31509 [00:01<00:48, 628.07it/s]","\rparsing log, completed traces ::   3%|2         | 837/31509 [00:01<00:49, 615.97it/s]","\rparsing log, completed traces ::   3%|2         | 901/31509 [00:01<00:49, 619.32it/s]","\rparsing log, completed traces ::   3%|3         | 973/31509 [00:02<00:47, 646.04it/s]","\rparsing log, completed traces ::   3%|3         | 1039/31509 [00:02<00:46, 648.56it/s]","\rparsing log, completed traces ::   4%|3         | 1105/31509 [00:02<00:47, 635.62it/s]","\rparsing log, completed traces ::   4%|3         | 1172/31509 [00:02<00:47, 644.40it/s]","\rparsing log, completed traces ::   4%|3         | 1241/31509 [00:02<00:46, 654.84it/s]","\rparsing log, completed traces ::   4%|4         | 1307/31509 [00:02<00:46, 649.07it/s]","\rparsing log, completed traces ::   4%|4         | 1374/31509 [00:02<00:46, 653.26it/s]","\rparsing log, completed traces ::   5%|4         | 1440/31509 [00:03<01:27, 343.66it/s]","\rparsing log, completed traces ::   5%|4         | 1502/31509 [00:03<01:16, 392.03it/s]","\rparsing log, completed traces ::   5%|4         | 1568/31509 [00:03<01:07, 446.03it/s]","\rparsing log, completed traces ::   5%|5         | 1633/31509 [00:03<01:00, 490.91it/s]","\rparsing log, completed traces ::   5%|5         | 1694/31509 [00:03<00:57, 517.11it/s]","\rparsing log, completed traces ::   6%|5         | 1759/31509 [00:03<00:53, 551.06it/s]","\rparsing log, completed traces ::   6%|5         | 1821/31509 [00:03<00:53, 556.22it/s]","\rparsing log, completed traces ::   6%|5         | 1881/31509 [00:03<00:52, 565.73it/s]","\rparsing log, completed traces ::   6%|6         | 1946/31509 [00:03<00:50, 587.82it/s]","\rparsing log, completed traces ::   6%|6         | 2011/31509 [00:04<00:48, 603.34it/s]","\rparsing log, completed traces ::   7%|6         | 2074/31509 [00:04<00:48, 609.16it/s]","\rparsing log, completed traces ::   7%|6         | 2138/31509 [00:04<00:47, 617.99it/s]","\rparsing log, completed traces ::   7%|6         | 2201/31509 [00:04<00:47, 621.42it/s]","\rparsing log, completed traces ::   7%|7         | 2272/31509 [00:04<00:45, 645.06it/s]","\rparsing log, completed traces ::   7%|7         | 2338/31509 [00:04<00:45, 647.48it/s]","\rparsing log, completed traces ::   8%|7         | 2404/31509 [00:04<00:45, 644.97it/s]","\rparsing log, completed traces ::   8%|7         | 2471/31509 [00:04<00:44, 646.03it/s]","\rparsing log, completed traces ::   8%|8         | 2536/31509 [00:05<01:22, 351.71it/s]","\rparsing log, completed traces ::   8%|8         | 2610/31509 [00:05<01:08, 423.18it/s]","\rparsing log, completed traces ::   8%|8         | 2677/31509 [00:05<01:00, 473.98it/s]","\rparsing log, completed traces ::   9%|8         | 2739/31509 [00:05<00:56, 505.61it/s]","\rparsing log, completed traces ::   9%|8         | 2806/31509 [00:05<00:52, 544.14it/s]","\rparsing log, completed traces ::   9%|9         | 2880/31509 [00:05<00:48, 593.37it/s]","\rparsing log, completed traces ::   9%|9         | 2952/31509 [00:05<00:45, 625.19it/s]","\rparsing log, completed traces ::  10%|9         | 3022/31509 [00:05<00:44, 642.80it/s]","\rparsing log, completed traces ::  10%|9         | 3090/31509 [00:05<00:44, 644.48it/s]","\rparsing log, completed traces ::  10%|#         | 3157/31509 [00:06<00:44, 644.26it/s]","\rparsing log, completed traces ::  10%|#         | 3224/31509 [00:06<00:44, 634.95it/s]","\rparsing log, completed traces ::  10%|#         | 3298/31509 [00:06<00:42, 664.01it/s]","\rparsing log, completed traces ::  11%|#         | 3369/31509 [00:06<00:41, 676.01it/s]","\rparsing log, completed traces ::  11%|#         | 3446/31509 [00:06<00:40, 701.36it/s]","\rparsing log, completed traces ::  11%|#1        | 3523/31509 [00:06<00:39, 717.21it/s]","\rparsing log, completed traces ::  11%|#1        | 3596/31509 [00:06<00:40, 689.81it/s]","\rparsing log, completed traces ::  12%|#1        | 3667/31509 [00:06<00:40, 694.02it/s]","\rparsing log, completed traces ::  12%|#1        | 3737/31509 [00:06<00:39, 694.85it/s]","\rparsing log, completed traces ::  12%|#2        | 3807/31509 [00:07<01:20, 342.43it/s]","\rparsing log, completed traces ::  12%|#2        | 3873/31509 [00:07<01:09, 396.29it/s]","\rparsing log, completed traces ::  13%|#2        | 3943/31509 [00:07<01:00, 454.62it/s]","\rparsing log, completed traces ::  13%|#2        | 4016/31509 [00:07<00:53, 512.71it/s]","\rparsing log, completed traces ::  13%|#2        | 4083/31509 [00:07<00:50, 547.78it/s]","\rparsing log, completed traces ::  13%|#3        | 4153/31509 [00:07<00:46, 584.94it/s]","\rparsing log, completed traces ::  13%|#3        | 4220/31509 [00:07<00:45, 595.66it/s]","\rparsing log, completed traces ::  14%|#3        | 4285/31509 [00:08<00:45, 595.64it/s]","\rparsing log, completed traces ::  14%|#3        | 4351/31509 [00:08<00:44, 612.07it/s]","\rparsing log, completed traces ::  14%|#4        | 4419/31509 [00:08<00:43, 629.68it/s]","\rparsing log, completed traces ::  14%|#4        | 4485/31509 [00:08<00:43, 623.50it/s]","\rparsing log, completed traces ::  14%|#4        | 4552/31509 [00:08<00:42, 636.34it/s]","\rparsing log, completed traces ::  15%|#4        | 4618/31509 [00:08<00:41, 642.87it/s]","\rparsing log, completed traces ::  15%|#4        | 4687/31509 [00:08<00:41, 652.78it/s]","\rparsing log, completed traces ::  15%|#5        | 4760/31509 [00:08<00:39, 674.45it/s]","\rparsing log, completed traces ::  15%|#5        | 4828/31509 [00:08<00:40, 665.74it/s]","\rparsing log, completed traces ::  16%|#5        | 4895/31509 [00:08<00:40, 660.34it/s]","\rparsing log, completed traces ::  16%|#5        | 4962/31509 [00:09<00:40, 656.79it/s]","\rparsing log, completed traces ::  16%|#5        | 5031/31509 [00:09<00:39, 662.89it/s]","\rparsing log, completed traces ::  16%|#6        | 5103/31509 [00:09<00:38, 679.39it/s]","\rparsing log, completed traces ::  16%|#6        | 5172/31509 [00:09<00:39, 668.19it/s]","\rparsing log, completed traces ::  17%|#6        | 5239/31509 [00:09<01:20, 326.39it/s]","\rparsing log, completed traces ::  17%|#6        | 5307/31509 [00:09<01:08, 385.03it/s]","\rparsing log, completed traces ::  17%|#7        | 5374/31509 [00:10<00:59, 439.73it/s]","\rparsing log, completed traces ::  17%|#7        | 5437/31509 [00:10<00:54, 480.66it/s]","\rparsing log, completed traces ::  17%|#7        | 5510/31509 [00:10<00:48, 539.52it/s]","\rparsing log, completed traces ::  18%|#7        | 5583/31509 [00:10<00:44, 585.18it/s]","\rparsing log, completed traces ::  18%|#7        | 5657/31509 [00:10<00:41, 625.46it/s]","\rparsing log, completed traces ::  18%|#8        | 5735/31509 [00:10<00:38, 667.34it/s]","\rparsing log, completed traces ::  18%|#8        | 5807/31509 [00:10<00:38, 674.48it/s]","\rparsing log, completed traces ::  19%|#8        | 5880/31509 [00:10<00:37, 690.19it/s]","\rparsing log, completed traces ::  19%|#8        | 5956/31509 [00:10<00:36, 707.26it/s]","\rparsing log, completed traces ::  19%|#9        | 6029/31509 [00:10<00:36, 695.11it/s]","\rparsing log, completed traces ::  19%|#9        | 6100/31509 [00:11<00:36, 687.86it/s]","\rparsing log, completed traces ::  20%|#9        | 6172/31509 [00:11<00:36, 696.73it/s]","\rparsing log, completed traces ::  20%|#9        | 6243/31509 [00:11<00:36, 699.72it/s]","\rparsing log, completed traces ::  20%|##        | 6314/31509 [00:11<00:36, 683.07it/s]","\rparsing log, completed traces ::  20%|##        | 6387/31509 [00:11<00:36, 695.49it/s]","\rparsing log, completed traces ::  20%|##        | 6457/31509 [00:11<00:36, 679.90it/s]","\rparsing log, completed traces ::  21%|##        | 6526/31509 [00:11<00:37, 666.39it/s]","\rparsing log, completed traces ::  21%|##        | 6593/31509 [00:11<00:38, 641.77it/s]","\rparsing log, completed traces ::  21%|##1       | 6660/31509 [00:11<00:38, 648.40it/s]","\rparsing log, completed traces ::  21%|##1       | 6730/31509 [00:12<00:37, 662.95it/s]","\rparsing log, completed traces ::  22%|##1       | 6797/31509 [00:12<00:37, 660.98it/s]","\rparsing log, completed traces ::  22%|##1       | 6864/31509 [00:12<01:24, 292.88it/s]","\rparsing log, completed traces ::  22%|##2       | 6935/31509 [00:12<01:08, 357.45it/s]","\rparsing log, completed traces ::  22%|##2       | 6999/31509 [00:12<01:00, 407.63it/s]","\rparsing log, completed traces ::  22%|##2       | 7074/31509 [00:12<00:51, 477.47it/s]","\rparsing log, completed traces ::  23%|##2       | 7142/31509 [00:13<00:46, 521.57it/s]","\rparsing log, completed traces ::  23%|##2       | 7207/31509 [00:13<00:44, 540.64it/s]","\rparsing log, completed traces ::  23%|##3       | 7275/31509 [00:13<00:42, 573.61it/s]","\rparsing log, completed traces ::  23%|##3       | 7340/31509 [00:13<00:41, 588.47it/s]","\rparsing log, completed traces ::  24%|##3       | 7407/31509 [00:13<00:39, 606.30it/s]","\rparsing log, completed traces ::  24%|##3       | 7478/31509 [00:13<00:37, 634.27it/s]","\rparsing log, completed traces ::  24%|##3       | 7551/31509 [00:13<00:36, 660.17it/s]","\rparsing log, completed traces ::  24%|##4       | 7620/31509 [00:13<00:36, 660.65it/s]","\rparsing log, completed traces ::  24%|##4       | 7688/31509 [00:13<00:36, 656.39it/s]","\rparsing log, completed traces ::  25%|##4       | 7755/31509 [00:13<00:35, 660.07it/s]","\rparsing log, completed traces ::  25%|##4       | 7822/31509 [00:14<00:36, 653.49it/s]","\rparsing log, completed traces ::  25%|##5       | 7894/31509 [00:14<00:35, 671.13it/s]","\rparsing log, completed traces ::  25%|##5       | 7964/31509 [00:14<00:34, 675.45it/s]","\rparsing log, completed traces ::  26%|##5       | 8035/31509 [00:14<00:34, 682.61it/s]","\rparsing log, completed traces ::  26%|##5       | 8104/31509 [00:14<00:34, 684.68it/s]","\rparsing log, completed traces ::  26%|##5       | 8173/31509 [00:14<00:34, 683.10it/s]","\rparsing log, completed traces ::  26%|##6       | 8244/31509 [00:14<00:33, 688.93it/s]","\rparsing log, completed traces ::  26%|##6       | 8315/31509 [00:14<00:33, 694.08it/s]","\rparsing log, completed traces ::  27%|##6       | 8385/31509 [00:14<00:34, 679.80it/s]","\rparsing log, completed traces ::  27%|##6       | 8454/31509 [00:15<00:34, 668.61it/s]","\rparsing log, completed traces ::  27%|##7       | 8524/31509 [00:15<00:34, 675.69it/s]","\rparsing log, completed traces ::  27%|##7       | 8592/31509 [00:15<00:34, 662.05it/s]","\rparsing log, completed traces ::  27%|##7       | 8659/31509 [00:15<01:22, 276.70it/s]","\rparsing log, completed traces ::  28%|##7       | 8727/31509 [00:15<01:07, 335.73it/s]","\rparsing log, completed traces ::  28%|##7       | 8796/31509 [00:15<00:57, 396.48it/s]","\rparsing log, completed traces ::  28%|##8       | 8864/31509 [00:16<00:50, 451.86it/s]","\rparsing log, completed traces ::  28%|##8       | 8927/31509 [00:16<00:46, 490.34it/s]","\rparsing log, completed traces ::  29%|##8       | 8994/31509 [00:16<00:42, 530.94it/s]","\rparsing log, completed traces ::  29%|##8       | 9058/31509 [00:16<00:41, 545.29it/s]","\rparsing log, completed traces ::  29%|##8       | 9125/31509 [00:16<00:38, 577.64it/s]","\rparsing log, completed traces ::  29%|##9       | 9193/31509 [00:16<00:37, 601.48it/s]","\rparsing log, completed traces ::  29%|##9       | 9258/31509 [00:16<00:36, 601.96it/s]","\rparsing log, completed traces ::  30%|##9       | 9331/31509 [00:16<00:35, 633.40it/s]","\rparsing log, completed traces ::  30%|##9       | 9397/31509 [00:16<00:35, 631.69it/s]","\rparsing log, completed traces ::  30%|###       | 9462/31509 [00:17<00:34, 634.38it/s]","\rparsing log, completed traces ::  30%|###       | 9529/31509 [00:17<00:34, 644.56it/s]","\rparsing log, completed traces ::  30%|###       | 9595/31509 [00:17<00:34, 635.32it/s]","\rparsing log, completed traces ::  31%|###       | 9662/31509 [00:17<00:33, 644.85it/s]","\rparsing log, completed traces ::  31%|###       | 9727/31509 [00:17<00:34, 633.58it/s]","\rparsing log, completed traces ::  31%|###1      | 9795/31509 [00:17<00:33, 644.37it/s]","\rparsing log, completed traces ::  31%|###1      | 9860/31509 [00:17<00:33, 639.99it/s]","\rparsing log, completed traces ::  31%|###1      | 9925/31509 [00:17<00:34, 634.32it/s]","\rparsing log, completed traces ::  32%|###1      | 9989/31509 [00:17<00:34, 631.49it/s]","\rparsing log, completed traces ::  32%|###1      | 10053/31509 [00:17<00:34, 626.35it/s]","\rparsing log, completed traces ::  32%|###2      | 10116/31509 [00:18<00:35, 604.08it/s]","\rparsing log, completed traces ::  32%|###2      | 10178/31509 [00:18<00:35, 608.48it/s]","\rparsing log, completed traces ::  33%|###2      | 10241/31509 [00:18<00:34, 613.53it/s]","\rparsing log, completed traces ::  33%|###2      | 10303/31509 [00:18<00:34, 612.44it/s]","\rparsing log, completed traces ::  33%|###2      | 10365/31509 [00:18<00:36, 586.91it/s]","\rparsing log, completed traces ::  33%|###3      | 10428/31509 [00:18<00:35, 598.58it/s]","\rparsing log, completed traces ::  33%|###3      | 10489/31509 [00:18<00:35, 593.54it/s]","\rparsing log, completed traces ::  33%|###3      | 10549/31509 [00:19<01:26, 242.78it/s]","\rparsing log, completed traces ::  34%|###3      | 10612/31509 [00:19<01:10, 296.91it/s]","\rparsing log, completed traces ::  34%|###3      | 10673/31509 [00:19<00:59, 349.63it/s]","\rparsing log, completed traces ::  34%|###4      | 10736/31509 [00:19<00:51, 403.24it/s]","\rparsing log, completed traces ::  34%|###4      | 10792/31509 [00:19<00:47, 434.42it/s]","\rparsing log, completed traces ::  34%|###4      | 10848/31509 [00:19<00:44, 460.87it/s]","\rparsing log, completed traces ::  35%|###4      | 10905/31509 [00:19<00:42, 487.54it/s]","\rparsing log, completed traces ::  35%|###4      | 10967/31509 [00:20<00:39, 520.45it/s]","\rparsing log, completed traces ::  35%|###5      | 11033/31509 [00:20<00:36, 555.33it/s]","\rparsing log, completed traces ::  35%|###5      | 11099/31509 [00:20<00:35, 581.99it/s]","\rparsing log, completed traces ::  35%|###5      | 11165/31509 [00:20<00:33, 603.06it/s]","\rparsing log, completed traces ::  36%|###5      | 11230/31509 [00:20<00:32, 615.97it/s]","\rparsing log, completed traces ::  36%|###5      | 11296/31509 [00:20<00:32, 626.79it/s]","\rparsing log, completed traces ::  36%|###6      | 11360/31509 [00:20<00:32, 616.56it/s]","\rparsing log, completed traces ::  36%|###6      | 11424/31509 [00:20<00:32, 622.26it/s]","\rparsing log, completed traces ::  36%|###6      | 11489/31509 [00:20<00:31, 627.19it/s]","\rparsing log, completed traces ::  37%|###6      | 11553/31509 [00:20<00:32, 614.18it/s]","\rparsing log, completed traces ::  37%|###6      | 11619/31509 [00:21<00:31, 625.10it/s]","\rparsing log, completed traces ::  37%|###7      | 11682/31509 [00:21<00:31, 625.05it/s]","\rparsing log, completed traces ::  37%|###7      | 11747/31509 [00:21<00:31, 631.61it/s]","\rparsing log, completed traces ::  37%|###7      | 11814/31509 [00:21<00:30, 641.93it/s]","\rparsing log, completed traces ::  38%|###7      | 11883/31509 [00:21<00:29, 655.11it/s]","\rparsing log, completed traces ::  38%|###7      | 11954/31509 [00:21<00:29, 670.93it/s]","\rparsing log, completed traces ::  38%|###8      | 12022/31509 [00:21<00:29, 658.60it/s]","\rparsing log, completed traces ::  38%|###8      | 12088/31509 [00:21<00:29, 658.44it/s]","\rparsing log, completed traces ::  39%|###8      | 12154/31509 [00:21<00:29, 654.44it/s]","\rparsing log, completed traces ::  39%|###8      | 12223/31509 [00:21<00:29, 664.52it/s]","\rparsing log, completed traces ::  39%|###9      | 12290/31509 [00:22<00:29, 657.44it/s]","\rparsing log, completed traces ::  39%|###9      | 12357/31509 [00:22<00:29, 658.87it/s]","\rparsing log, completed traces ::  39%|###9      | 12427/31509 [00:22<00:28, 666.02it/s]","\rparsing log, completed traces ::  40%|###9      | 12494/31509 [00:22<00:28, 663.30it/s]","\rparsing log, completed traces ::  40%|###9      | 12561/31509 [00:22<00:28, 654.08it/s]","\rparsing log, completed traces ::  40%|####      | 12629/31509 [00:22<00:28, 659.65it/s]","\rparsing log, completed traces ::  40%|####      | 12695/31509 [00:23<01:17, 242.23it/s]","\rparsing log, completed traces ::  41%|####      | 12762/31509 [00:23<01:02, 298.89it/s]","\rparsing log, completed traces ::  41%|####      | 12828/31509 [00:23<00:52, 356.41it/s]","\rparsing log, completed traces ::  41%|####      | 12892/31509 [00:23<00:45, 408.95it/s]","\rparsing log, completed traces ::  41%|####1     | 12954/31509 [00:23<00:40, 452.87it/s]","\rparsing log, completed traces ::  41%|####1     | 13024/31509 [00:23<00:36, 508.21it/s]","\rparsing log, completed traces ::  42%|####1     | 13101/31509 [00:23<00:32, 571.93it/s]","\rparsing log, completed traces ::  42%|####1     | 13168/31509 [00:23<00:31, 585.32it/s]","\rparsing log, completed traces ::  42%|####2     | 13234/31509 [00:24<00:30, 601.05it/s]","\rparsing log, completed traces ::  42%|####2     | 13300/31509 [00:24<00:29, 611.27it/s]","\rparsing log, completed traces ::  42%|####2     | 13366/31509 [00:24<00:29, 624.88it/s]","\rparsing log, completed traces ::  43%|####2     | 13433/31509 [00:24<00:28, 630.95it/s]","\rparsing log, completed traces ::  43%|####2     | 13498/31509 [00:24<00:28, 636.26it/s]","\rparsing log, completed traces ::  43%|####3     | 13563/31509 [00:24<00:29, 615.02it/s]","\rparsing log, completed traces ::  43%|####3     | 13626/31509 [00:24<00:29, 613.49it/s]","\rparsing log, completed traces ::  43%|####3     | 13690/31509 [00:24<00:28, 620.98it/s]","\rparsing log, completed traces ::  44%|####3     | 13759/31509 [00:24<00:27, 638.82it/s]","\rparsing log, completed traces ::  44%|####3     | 13824/31509 [00:24<00:27, 638.79it/s]","\rparsing log, completed traces ::  44%|####4     | 13889/31509 [00:25<00:28, 626.10it/s]","\rparsing log, completed traces ::  44%|####4     | 13955/31509 [00:25<00:27, 634.83it/s]","\rparsing log, completed traces ::  44%|####4     | 14020/31509 [00:25<00:27, 636.55it/s]","\rparsing log, completed traces ::  45%|####4     | 14089/31509 [00:25<00:26, 645.65it/s]","\rparsing log, completed traces ::  45%|####4     | 14159/31509 [00:25<00:26, 660.13it/s]","\rparsing log, completed traces ::  45%|####5     | 14226/31509 [00:25<00:26, 657.47it/s]","\rparsing log, completed traces ::  45%|####5     | 14293/31509 [00:25<00:26, 660.83it/s]","\rparsing log, completed traces ::  46%|####5     | 14364/31509 [00:25<00:25, 673.95it/s]","\rparsing log, completed traces ::  46%|####5     | 14433/31509 [00:25<00:25, 675.59it/s]","\rparsing log, completed traces ::  46%|####6     | 14501/31509 [00:26<00:25, 676.20it/s]","\rparsing log, completed traces ::  46%|####6     | 14569/31509 [00:26<00:26, 651.28it/s]","\rparsing log, completed traces ::  46%|####6     | 14635/31509 [00:26<00:26, 639.50it/s]","\rparsing log, completed traces ::  47%|####6     | 14702/31509 [00:26<00:25, 647.22it/s]","\rparsing log, completed traces ::  47%|####6     | 14767/31509 [00:26<00:25, 646.34it/s]","\rparsing log, completed traces ::  47%|####7     | 14838/31509 [00:26<00:25, 662.66it/s]","\rparsing log, completed traces ::  47%|####7     | 14905/31509 [00:26<00:25, 657.93it/s]","\rparsing log, completed traces ::  48%|####7     | 14976/31509 [00:26<00:24, 672.37it/s]","\rparsing log, completed traces ::  48%|####7     | 15044/31509 [00:26<00:24, 671.13it/s]","\rparsing log, completed traces ::  48%|####7     | 15116/31509 [00:26<00:23, 684.23it/s]","\rparsing log, completed traces ::  48%|####8     | 15185/31509 [00:27<01:09, 235.31it/s]","\rparsing log, completed traces ::  48%|####8     | 15253/31509 [00:27<00:55, 291.37it/s]","\rparsing log, completed traces ::  49%|####8     | 15326/31509 [00:27<00:45, 358.23it/s]","\rparsing log, completed traces ::  49%|####8     | 15396/31509 [00:27<00:38, 419.58it/s]","\rparsing log, completed traces ::  49%|####9     | 15461/31509 [00:28<00:34, 465.92it/s]","\rparsing log, completed traces ::  49%|####9     | 15527/31509 [00:28<00:31, 508.48it/s]","\rparsing log, completed traces ::  50%|####9     | 15597/31509 [00:28<00:28, 554.71it/s]","\rparsing log, completed traces ::  50%|####9     | 15671/31509 [00:28<00:26, 599.88it/s]","\rparsing log, completed traces ::  50%|####9     | 15739/31509 [00:28<00:25, 609.26it/s]","\rparsing log, completed traces ::  50%|#####     | 15807/31509 [00:28<00:25, 626.58it/s]","\rparsing log, completed traces ::  50%|#####     | 15880/31509 [00:28<00:23, 653.28it/s]","\rparsing log, completed traces ::  51%|#####     | 15949/31509 [00:28<00:23, 657.42it/s]","\rparsing log, completed traces ::  51%|#####     | 16017/31509 [00:28<00:23, 661.00it/s]","\rparsing log, completed traces ::  51%|#####1    | 16090/31509 [00:29<00:22, 678.81it/s]","\rparsing log, completed traces ::  51%|#####1    | 16165/31509 [00:29<00:21, 698.52it/s]","\rparsing log, completed traces ::  52%|#####1    | 16237/31509 [00:29<00:21, 703.69it/s]","\rparsing log, completed traces ::  52%|#####1    | 16309/31509 [00:29<00:21, 707.40it/s]","\rparsing log, completed traces ::  52%|#####1    | 16381/31509 [00:29<00:22, 676.29it/s]","\rparsing log, completed traces ::  52%|#####2    | 16450/31509 [00:29<00:22, 668.71it/s]","\rparsing log, completed traces ::  52%|#####2    | 16518/31509 [00:29<00:23, 646.38it/s]","\rparsing log, completed traces ::  53%|#####2    | 16589/31509 [00:29<00:22, 661.77it/s]","\rparsing log, completed traces ::  53%|#####2    | 16662/31509 [00:29<00:21, 680.27it/s]","\rparsing log, completed traces ::  53%|#####3    | 16731/31509 [00:29<00:21, 681.84it/s]","\rparsing log, completed traces ::  53%|#####3    | 16800/31509 [00:30<00:21, 672.66it/s]","\rparsing log, completed traces ::  54%|#####3    | 16868/31509 [00:30<00:21, 674.01it/s]","\rparsing log, completed traces ::  54%|#####3    | 16938/31509 [00:30<00:21, 681.07it/s]","\rparsing log, completed traces ::  54%|#####3    | 17007/31509 [00:30<00:21, 682.77it/s]","\rparsing log, completed traces ::  54%|#####4    | 17086/31509 [00:30<00:20, 714.31it/s]","\rparsing log, completed traces ::  54%|#####4    | 17158/31509 [00:30<00:20, 705.26it/s]","\rparsing log, completed traces ::  55%|#####4    | 17229/31509 [00:30<00:20, 687.89it/s]","\rparsing log, completed traces ::  55%|#####4    | 17301/31509 [00:30<00:20, 694.82it/s]","\rparsing log, completed traces ::  55%|#####5    | 17371/31509 [00:30<00:20, 689.95it/s]","\rparsing log, completed traces ::  55%|#####5    | 17447/31509 [00:30<00:19, 708.10it/s]","\rparsing log, completed traces ::  56%|#####5    | 17518/31509 [00:31<00:20, 676.68it/s]","\rparsing log, completed traces ::  56%|#####5    | 17591/31509 [00:31<00:20, 690.78it/s]","\rparsing log, completed traces ::  56%|#####6    | 17668/31509 [00:31<00:19, 713.32it/s]","\rparsing log, completed traces ::  56%|#####6    | 17740/31509 [00:31<00:19, 697.69it/s]","\rparsing log, completed traces ::  57%|#####6    | 17812/31509 [00:31<00:19, 702.37it/s]","\rparsing log, completed traces ::  57%|#####6    | 17884/31509 [00:31<00:19, 706.37it/s]","\rparsing log, completed traces ::  57%|#####6    | 17957/31509 [00:31<00:19, 712.83it/s]","\rparsing log, completed traces ::  57%|#####7    | 18031/31509 [00:31<00:18, 720.36it/s]","\rparsing log, completed traces ::  57%|#####7    | 18104/31509 [00:31<00:18, 718.57it/s]","\rparsing log, completed traces ::  58%|#####7    | 18176/31509 [00:32<00:57, 232.44it/s]","\rparsing log, completed traces ::  58%|#####7    | 18245/31509 [00:32<00:46, 287.28it/s]","\rparsing log, completed traces ::  58%|#####8    | 18312/31509 [00:32<00:38, 342.59it/s]","\rparsing log, completed traces ::  58%|#####8    | 18386/31509 [00:33<00:31, 411.26it/s]","\rparsing log, completed traces ::  59%|#####8    | 18457/31509 [00:33<00:27, 470.25it/s]","\rparsing log, completed traces ::  59%|#####8    | 18524/31509 [00:33<00:25, 512.80it/s]","\rparsing log, completed traces ::  59%|#####9    | 18591/31509 [00:33<00:23, 545.10it/s]","\rparsing log, completed traces ::  59%|#####9    | 18669/31509 [00:33<00:21, 603.89it/s]","\rparsing log, completed traces ::  59%|#####9    | 18744/31509 [00:33<00:19, 639.82it/s]","\rparsing log, completed traces ::  60%|#####9    | 18815/31509 [00:33<00:19, 647.08it/s]","\rparsing log, completed traces ::  60%|#####9    | 18890/31509 [00:33<00:18, 674.37it/s]","\rparsing log, completed traces ::  60%|######    | 18962/31509 [00:33<00:18, 684.78it/s]","\rparsing log, completed traces ::  60%|######    | 19033/31509 [00:33<00:18, 690.46it/s]","\rparsing log, completed traces ::  61%|######    | 19106/31509 [00:34<00:17, 699.21it/s]","\rparsing log, completed traces ::  61%|######    | 19178/31509 [00:34<00:17, 704.07it/s]","\rparsing log, completed traces ::  61%|######1   | 19250/31509 [00:34<00:17, 696.35it/s]","\rparsing log, completed traces ::  61%|######1   | 19321/31509 [00:34<00:17, 696.04it/s]","\rparsing log, completed traces ::  62%|######1   | 19397/31509 [00:34<00:16, 712.52it/s]","\rparsing log, completed traces ::  62%|######1   | 19469/31509 [00:34<00:16, 713.14it/s]","\rparsing log, completed traces ::  62%|######2   | 19541/31509 [00:34<00:16, 709.39it/s]","\rparsing log, completed traces ::  62%|######2   | 19613/31509 [00:34<00:16, 709.41it/s]","\rparsing log, completed traces ::  62%|######2   | 19685/31509 [00:34<00:17, 690.97it/s]","\rparsing log, completed traces ::  63%|######2   | 19756/31509 [00:34<00:16, 694.33it/s]","\rparsing log, completed traces ::  63%|######2   | 19826/31509 [00:35<00:16, 688.28it/s]","\rparsing log, completed traces ::  63%|######3   | 19895/31509 [00:35<00:17, 677.28it/s]","\rparsing log, completed traces ::  63%|######3   | 19963/31509 [00:35<00:17, 678.03it/s]","\rparsing log, completed traces ::  64%|######3   | 20031/31509 [00:35<00:17, 674.20it/s]","\rparsing log, completed traces ::  64%|######3   | 20099/31509 [00:35<00:17, 666.38it/s]","\rparsing log, completed traces ::  64%|######4   | 20168/31509 [00:35<00:16, 672.45it/s]","\rparsing log, completed traces ::  64%|######4   | 20242/31509 [00:35<00:16, 690.73it/s]","\rparsing log, completed traces ::  64%|######4   | 20313/31509 [00:35<00:16, 696.31it/s]","\rparsing log, completed traces ::  65%|######4   | 20383/31509 [00:35<00:15, 696.86it/s]","\rparsing log, completed traces ::  65%|######4   | 20462/31509 [00:35<00:15, 723.08it/s]","\rparsing log, completed traces ::  65%|######5   | 20535/31509 [00:36<00:15, 717.54it/s]","\rparsing log, completed traces ::  65%|######5   | 20608/31509 [00:36<00:15, 720.38it/s]","\rparsing log, completed traces ::  66%|######5   | 20683/31509 [00:36<00:14, 728.11it/s]","\rparsing log, completed traces ::  66%|######5   | 20758/31509 [00:36<00:14, 731.82it/s]","\rparsing log, completed traces ::  66%|######6   | 20832/31509 [00:36<00:15, 709.99it/s]","\rparsing log, completed traces ::  66%|######6   | 20904/31509 [00:36<00:14, 712.72it/s]","\rparsing log, completed traces ::  67%|######6   | 20976/31509 [00:36<00:15, 698.20it/s]","\rparsing log, completed traces ::  67%|######6   | 21046/31509 [00:36<00:15, 685.38it/s]","\rparsing log, completed traces ::  67%|######7   | 21115/31509 [00:36<00:15, 684.55it/s]","\rparsing log, completed traces ::  67%|######7   | 21184/31509 [00:37<00:15, 680.27it/s]","\rparsing log, completed traces ::  67%|######7   | 21259/31509 [00:37<00:14, 700.21it/s]","\rparsing log, completed traces ::  68%|######7   | 21330/31509 [00:37<00:14, 701.30it/s]","\rparsing log, completed traces ::  68%|######7   | 21401/31509 [00:37<00:14, 690.64it/s]","\rparsing log, completed traces ::  68%|######8   | 21471/31509 [00:38<00:48, 205.81it/s]","\rparsing log, completed traces ::  68%|######8   | 21545/31509 [00:38<00:37, 264.60it/s]","\rparsing log, completed traces ::  69%|######8   | 21616/31509 [00:38<00:30, 325.03it/s]","\rparsing log, completed traces ::  69%|######8   | 21680/31509 [00:38<00:26, 375.70it/s]","\rparsing log, completed traces ::  69%|######9   | 21761/31509 [00:38<00:21, 457.24it/s]","\rparsing log, completed traces ::  69%|######9   | 21835/31509 [00:38<00:18, 516.88it/s]","\rparsing log, completed traces ::  70%|######9   | 21912/31509 [00:38<00:16, 575.24it/s]","\rparsing log, completed traces ::  70%|######9   | 21984/31509 [00:38<00:15, 608.17it/s]","\rparsing log, completed traces ::  70%|#######   | 22061/31509 [00:39<00:14, 649.44it/s]","\rparsing log, completed traces ::  70%|#######   | 22136/31509 [00:39<00:13, 674.59it/s]","\rparsing log, completed traces ::  70%|#######   | 22210/31509 [00:39<00:13, 683.60it/s]","\rparsing log, completed traces ::  71%|#######   | 22284/31509 [00:39<00:13, 694.44it/s]","\rparsing log, completed traces ::  71%|#######   | 22357/31509 [00:39<00:13, 694.03it/s]","\rparsing log, completed traces ::  71%|#######1  | 22434/31509 [00:39<00:12, 714.53it/s]","\rparsing log, completed traces ::  71%|#######1  | 22510/31509 [00:39<00:12, 725.24it/s]","\rparsing log, completed traces ::  72%|#######1  | 22584/31509 [00:39<00:12, 711.45it/s]","\rparsing log, completed traces ::  72%|#######1  | 22656/31509 [00:39<00:12, 703.13it/s]","\rparsing log, completed traces ::  72%|#######2  | 22727/31509 [00:39<00:12, 699.37it/s]","\rparsing log, completed traces ::  72%|#######2  | 22800/31509 [00:40<00:12, 705.56it/s]","\rparsing log, completed traces ::  73%|#######2  | 22871/31509 [00:40<00:12, 706.33it/s]","\rparsing log, completed traces ::  73%|#######2  | 22942/31509 [00:40<00:12, 680.23it/s]","\rparsing log, completed traces ::  73%|#######3  | 23011/31509 [00:40<00:12, 676.07it/s]","\rparsing log, completed traces ::  73%|#######3  | 23081/31509 [00:40<00:12, 679.09it/s]","\rparsing log, completed traces ::  73%|#######3  | 23150/31509 [00:40<00:12, 677.73it/s]","\rparsing log, completed traces ::  74%|#######3  | 23218/31509 [00:40<00:12, 674.92it/s]","\rparsing log, completed traces ::  74%|#######3  | 23286/31509 [00:40<00:12, 668.84it/s]","\rparsing log, completed traces ::  74%|#######4  | 23353/31509 [00:40<00:12, 657.25it/s]","\rparsing log, completed traces ::  74%|#######4  | 23421/31509 [00:41<00:12, 660.96it/s]","\rparsing log, completed traces ::  75%|#######4  | 23488/31509 [00:41<00:12, 662.87it/s]","\rparsing log, completed traces ::  75%|#######4  | 23558/31509 [00:41<00:11, 673.12it/s]","\rparsing log, completed traces ::  75%|#######4  | 23629/31509 [00:41<00:11, 681.20it/s]","\rparsing log, completed traces ::  75%|#######5  | 23698/31509 [00:41<00:11, 678.52it/s]","\rparsing log, completed traces ::  75%|#######5  | 23770/31509 [00:41<00:11, 689.53it/s]","\rparsing log, completed traces ::  76%|#######5  | 23839/31509 [00:41<00:11, 677.59it/s]","\rparsing log, completed traces ::  76%|#######5  | 23908/31509 [00:41<00:11, 679.41it/s]","\rparsing log, completed traces ::  76%|#######6  | 23976/31509 [00:41<00:11, 678.21it/s]","\rparsing log, completed traces ::  76%|#######6  | 24044/31509 [00:41<00:11, 674.94it/s]","\rparsing log, completed traces ::  77%|#######6  | 24115/31509 [00:42<00:10, 684.79it/s]","\rparsing log, completed traces ::  77%|#######6  | 24184/31509 [00:42<00:10, 685.84it/s]","\rparsing log, completed traces ::  77%|#######6  | 24253/31509 [00:42<00:10, 677.10it/s]","\rparsing log, completed traces ::  77%|#######7  | 24326/31509 [00:42<00:10, 691.57it/s]","\rparsing log, completed traces ::  77%|#######7  | 24397/31509 [00:42<00:10, 696.18it/s]","\rparsing log, completed traces ::  78%|#######7  | 24467/31509 [00:42<00:10, 691.69it/s]","\rparsing log, completed traces ::  78%|#######7  | 24537/31509 [00:42<00:10, 692.39it/s]","\rparsing log, completed traces ::  78%|#######8  | 24617/31509 [00:42<00:09, 721.45it/s]","\rparsing log, completed traces ::  78%|#######8  | 24690/31509 [00:42<00:09, 707.99it/s]","\rparsing log, completed traces ::  79%|#######8  | 24761/31509 [00:42<00:09, 707.89it/s]","\rparsing log, completed traces ::  79%|#######8  | 24835/31509 [00:43<00:09, 714.27it/s]","\rparsing log, completed traces ::  79%|#######9  | 24907/31509 [00:43<00:09, 713.71it/s]","\rparsing log, completed traces ::  79%|#######9  | 24983/31509 [00:43<00:09, 723.21it/s]","\rparsing log, completed traces ::  80%|#######9  | 25056/31509 [00:43<00:09, 705.02it/s]","\rparsing log, completed traces ::  80%|#######9  | 25127/31509 [00:43<00:09, 689.77it/s]","\rparsing log, completed traces ::  80%|#######9  | 25197/31509 [00:44<00:33, 190.52it/s]","\rparsing log, completed traces ::  80%|########  | 25263/31509 [00:44<00:26, 238.35it/s]","\rparsing log, completed traces ::  80%|########  | 25322/31509 [00:44<00:21, 282.56it/s]","\rparsing log, completed traces ::  81%|########  | 25396/31509 [00:44<00:17, 352.47it/s]","\rparsing log, completed traces ::  81%|########  | 25463/31509 [00:44<00:14, 409.20it/s]","\rparsing log, completed traces ::  81%|########1 | 25531/31509 [00:44<00:12, 464.20it/s]","\rparsing log, completed traces ::  81%|########1 | 25603/31509 [00:45<00:11, 519.40it/s]","\rparsing log, completed traces ::  81%|########1 | 25670/31509 [00:45<00:10, 552.76it/s]","\rparsing log, completed traces ::  82%|########1 | 25738/31509 [00:45<00:09, 583.98it/s]","\rparsing log, completed traces ::  82%|########1 | 25806/31509 [00:45<00:09, 608.08it/s]","\rparsing log, completed traces ::  82%|########2 | 25873/31509 [00:45<00:09, 624.51it/s]","\rparsing log, completed traces ::  82%|########2 | 25943/31509 [00:45<00:08, 643.49it/s]","\rparsing log, completed traces ::  83%|########2 | 26011/31509 [00:45<00:08, 640.79it/s]","\rparsing log, completed traces ::  83%|########2 | 26078/31509 [00:45<00:08, 645.91it/s]","\rparsing log, completed traces ::  83%|########2 | 26148/31509 [00:45<00:08, 652.58it/s]","\rparsing log, completed traces ::  83%|########3 | 26220/31509 [00:46<00:07, 672.05it/s]","\rparsing log, completed traces ::  83%|########3 | 26292/31509 [00:46<00:07, 684.06it/s]","\rparsing log, completed traces ::  84%|########3 | 26364/31509 [00:46<00:07, 694.53it/s]","\rparsing log, completed traces ::  84%|########3 | 26434/31509 [00:46<00:07, 666.59it/s]","\rparsing log, completed traces ::  84%|########4 | 26502/31509 [00:46<00:07, 653.29it/s]","\rparsing log, completed traces ::  84%|########4 | 26569/31509 [00:46<00:07, 657.68it/s]","\rparsing log, completed traces ::  85%|########4 | 26636/31509 [00:46<00:07, 654.91it/s]","\rparsing log, completed traces ::  85%|########4 | 26703/31509 [00:46<00:07, 658.51it/s]","\rparsing log, completed traces ::  85%|########4 | 26775/31509 [00:46<00:07, 673.59it/s]","\rparsing log, completed traces ::  85%|########5 | 26844/31509 [00:46<00:06, 676.29it/s]","\rparsing log, completed traces ::  85%|########5 | 26912/31509 [00:47<00:06, 666.20it/s]","\rparsing log, completed traces ::  86%|########5 | 26980/31509 [00:47<00:06, 668.97it/s]","\rparsing log, completed traces ::  86%|########5 | 27047/31509 [00:47<00:06, 654.00it/s]","\rparsing log, completed traces ::  86%|########6 | 27116/31509 [00:47<00:06, 662.32it/s]","\rparsing log, completed traces ::  86%|########6 | 27186/31509 [00:47<00:06, 672.06it/s]","\rparsing log, completed traces ::  87%|########6 | 27260/31509 [00:47<00:06, 691.06it/s]","\rparsing log, completed traces ::  87%|########6 | 27330/31509 [00:47<00:06, 667.46it/s]","\rparsing log, completed traces ::  87%|########6 | 27399/31509 [00:47<00:06, 672.94it/s]","\rparsing log, completed traces ::  87%|########7 | 27468/31509 [00:47<00:05, 676.07it/s]","\rparsing log, completed traces ::  87%|########7 | 27536/31509 [00:47<00:05, 669.67it/s]","\rparsing log, completed traces ::  88%|########7 | 27610/31509 [00:48<00:05, 686.40it/s]","\rparsing log, completed traces ::  88%|########7 | 27681/31509 [00:48<00:05, 693.03it/s]","\rparsing log, completed traces ::  88%|########8 | 27756/31509 [00:48<00:05, 707.49it/s]","\rparsing log, completed traces ::  88%|########8 | 27827/31509 [00:48<00:05, 690.73it/s]","\rparsing log, completed traces ::  89%|########8 | 27897/31509 [00:48<00:05, 681.16it/s]","\rparsing log, completed traces ::  89%|########8 | 27966/31509 [00:48<00:05, 672.92it/s]","\rparsing log, completed traces ::  89%|########8 | 28038/31509 [00:48<00:05, 684.26it/s]","\rparsing log, completed traces ::  89%|########9 | 28107/31509 [00:48<00:05, 659.72it/s]","\rparsing log, completed traces ::  89%|########9 | 28174/31509 [00:48<00:05, 661.70it/s]","\rparsing log, completed traces ::  90%|########9 | 28246/31509 [00:49<00:04, 678.04it/s]","\rparsing log, completed traces ::  90%|########9 | 28314/31509 [00:49<00:04, 670.52it/s]","\rparsing log, completed traces ::  90%|######### | 28385/31509 [00:49<00:04, 680.46it/s]","\rparsing log, completed traces ::  90%|######### | 28454/31509 [00:49<00:04, 668.87it/s]","\rparsing log, completed traces ::  91%|######### | 28526/31509 [00:49<00:04, 683.61it/s]","\rparsing log, completed traces ::  91%|######### | 28599/31509 [00:49<00:04, 696.73it/s]","\rparsing log, completed traces ::  91%|######### | 28669/31509 [00:49<00:04, 691.31it/s]","\rparsing log, completed traces ::  91%|#########1| 28739/31509 [00:49<00:04, 654.40it/s]","\rparsing log, completed traces ::  91%|#########1| 28805/31509 [00:49<00:04, 643.44it/s]","\rparsing log, completed traces ::  92%|#########1| 28870/31509 [00:49<00:04, 628.60it/s]","\rparsing log, completed traces ::  92%|#########1| 28940/31509 [00:50<00:03, 646.19it/s]","\rparsing log, completed traces ::  92%|#########2| 29010/31509 [00:50<00:03, 659.17it/s]","\rparsing log, completed traces ::  92%|#########2| 29077/31509 [00:50<00:03, 647.55it/s]","\rparsing log, completed traces ::  92%|#########2| 29142/31509 [00:50<00:03, 647.64it/s]","\rparsing log, completed traces ::  93%|#########2| 29214/31509 [00:50<00:03, 668.05it/s]","\rparsing log, completed traces ::  93%|#########2| 29281/31509 [00:51<00:13, 168.66it/s]","\rparsing log, completed traces ::  93%|#########3| 29351/31509 [00:51<00:09, 219.39it/s]","\rparsing log, completed traces ::  93%|#########3| 29414/31509 [00:51<00:07, 268.53it/s]","\rparsing log, completed traces ::  94%|#########3| 29476/31509 [00:51<00:06, 319.31it/s]","\rparsing log, completed traces ::  94%|#########3| 29535/31509 [00:51<00:05, 363.59it/s]","\rparsing log, completed traces ::  94%|#########3| 29605/31509 [00:52<00:04, 428.59it/s]","\rparsing log, completed traces ::  94%|#########4| 29675/31509 [00:52<00:03, 486.58it/s]","\rparsing log, completed traces ::  94%|#########4| 29743/31509 [00:52<00:03, 531.70it/s]","\rparsing log, completed traces ::  95%|#########4| 29808/31509 [00:52<00:03, 556.23it/s]","\rparsing log, completed traces ::  95%|#########4| 29876/31509 [00:52<00:02, 588.50it/s]","\rparsing log, completed traces ::  95%|#########5| 29944/31509 [00:52<00:02, 613.05it/s]","\rparsing log, completed traces ::  95%|#########5| 30012/31509 [00:52<00:02, 629.70it/s]","\rparsing log, completed traces ::  95%|#########5| 30079/31509 [00:52<00:02, 630.48it/s]","\rparsing log, completed traces ::  96%|#########5| 30152/31509 [00:52<00:02, 657.82it/s]","\rparsing log, completed traces ::  96%|#########5| 30223/31509 [00:53<00:01, 669.52it/s]","\rparsing log, completed traces ::  96%|#########6| 30292/31509 [00:53<00:01, 667.61it/s]","\rparsing log, completed traces ::  96%|#########6| 30366/31509 [00:53<00:01, 688.73it/s]","\rparsing log, completed traces ::  97%|#########6| 30436/31509 [00:53<00:01, 679.73it/s]","\rparsing log, completed traces ::  97%|#########6| 30505/31509 [00:53<00:01, 677.36it/s]","\rparsing log, completed traces ::  97%|#########7| 30580/31509 [00:53<00:01, 697.49it/s]","\rparsing log, completed traces ::  97%|#########7| 30651/31509 [00:53<00:01, 692.13it/s]","\rparsing log, completed traces ::  97%|#########7| 30721/31509 [00:53<00:01, 692.77it/s]","\rparsing log, completed traces ::  98%|#########7| 30791/31509 [00:53<00:01, 687.77it/s]","\rparsing log, completed traces ::  98%|#########7| 30861/31509 [00:53<00:00, 688.98it/s]","\rparsing log, completed traces ::  98%|#########8| 30930/31509 [00:54<00:00, 680.64it/s]","\rparsing log, completed traces ::  98%|#########8| 31001/31509 [00:54<00:00, 687.52it/s]","\rparsing log, completed traces ::  99%|#########8| 31072/31509 [00:54<00:00, 693.32it/s]","\rparsing log, completed traces ::  99%|#########8| 31143/31509 [00:54<00:00, 691.55it/s]","\rparsing log, completed traces ::  99%|#########9| 31219/31509 [00:54<00:00, 709.33it/s]","\rparsing log, completed traces ::  99%|#########9| 31290/31509 [00:54<00:00, 667.30it/s]","\rparsing log, completed traces :: 100%|#########9| 31358/31509 [00:54<00:00, 660.42it/s]","\rparsing log, completed traces :: 100%|#########9| 31429/31509 [00:54<00:00, 672.89it/s]","\rparsing log, completed traces :: 100%|#########9| 31497/31509 [00:54<00:00, 659.35it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:54<00:00, 574.00it/s]","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   1%|          | 756/150370 [00:00<00:19, 7540.12it/s]","\rparsing log, completed traces ::   1%|1         | 1574/150370 [00:00<00:18, 7878.00it/s]","\rparsing log, completed traces ::   2%|1         | 2383/150370 [00:00<00:18, 7973.92it/s]","\rparsing log, completed traces ::   2%|2         | 3181/150370 [00:00<00:18, 7938.32it/s]","\rparsing log, completed traces ::   3%|2         | 3984/150370 [00:00<00:18, 7971.20it/s]","\rparsing log, completed traces ::   3%|3         | 4782/150370 [00:00<00:18, 7960.41it/s]","\rparsing log, completed traces ::   4%|3         | 5585/150370 [00:00<00:18, 7982.21it/s]","\rparsing log, completed traces ::   4%|4         | 6384/150370 [00:00<00:18, 7932.17it/s]","\rparsing log, completed traces ::   5%|4         | 7178/150370 [00:01<00:30, 4653.86it/s]","\rparsing log, completed traces ::   5%|5         | 7969/150370 [00:01<00:26, 5326.03it/s]","\rparsing log, completed traces ::   6%|5         | 8805/150370 [00:01<00:23, 6005.56it/s]","\rparsing log, completed traces ::   6%|6         | 9643/150370 [00:01<00:21, 6572.97it/s]","\rparsing log, completed traces ::   7%|6         | 10437/150370 [00:01<00:20, 6926.75it/s]","\rparsing log, completed traces ::   7%|7         | 11243/150370 [00:01<00:19, 7232.11it/s]","\rparsing log, completed traces ::   8%|8         | 12051/150370 [00:01<00:18, 7468.03it/s]","\rparsing log, completed traces ::   9%|8         | 12839/150370 [00:01<00:18, 7561.81it/s]","\rparsing log, completed traces ::   9%|9         | 13639/150370 [00:01<00:17, 7687.41it/s]","\rparsing log, completed traces ::  10%|9         | 14429/150370 [00:02<00:17, 7728.79it/s]","\rparsing log, completed traces ::  10%|#         | 15228/150370 [00:02<00:17, 7803.92it/s]","\rparsing log, completed traces ::  11%|#         | 16069/150370 [00:02<00:16, 7981.77it/s]","\rparsing log, completed traces ::  11%|#1        | 16917/150370 [00:02<00:16, 8107.14it/s]","\rparsing log, completed traces ::  12%|#1        | 17734/150370 [00:02<00:30, 4411.47it/s]","\rparsing log, completed traces ::  12%|#2        | 18550/150370 [00:02<00:25, 5113.56it/s]","\rparsing log, completed traces ::  13%|#2        | 19351/150370 [00:02<00:22, 5724.88it/s]","\rparsing log, completed traces ::  13%|#3        | 20168/150370 [00:03<00:20, 6289.56it/s]","\rparsing log, completed traces ::  14%|#3        | 20981/150370 [00:03<00:19, 6746.04it/s]","\rparsing log, completed traces ::  15%|#4        | 21870/150370 [00:03<00:17, 7304.98it/s]","\rparsing log, completed traces ::  15%|#5        | 22750/150370 [00:03<00:16, 7711.89it/s]","\rparsing log, completed traces ::  16%|#5        | 23582/150370 [00:03<00:16, 7880.28it/s]","\rparsing log, completed traces ::  16%|#6        | 24411/150370 [00:03<00:16, 7456.14it/s]","\rparsing log, completed traces ::  17%|#6        | 25190/150370 [00:03<00:17, 7187.77it/s]","\rparsing log, completed traces ::  17%|#7        | 25933/150370 [00:03<00:17, 7035.78it/s]","\rparsing log, completed traces ::  18%|#7        | 26653/150370 [00:03<00:18, 6801.81it/s]","\rparsing log, completed traces ::  18%|#8        | 27345/150370 [00:03<00:18, 6750.51it/s]","\rparsing log, completed traces ::  19%|#8        | 28028/150370 [00:04<00:18, 6635.03it/s]","\rparsing log, completed traces ::  19%|#9        | 28697/150370 [00:04<00:33, 3599.90it/s]","\rparsing log, completed traces ::  20%|#9        | 29488/150370 [00:04<00:27, 4367.39it/s]","\rparsing log, completed traces ::  20%|##        | 30203/150370 [00:04<00:24, 4930.41it/s]","\rparsing log, completed traces ::  21%|##        | 30885/150370 [00:04<00:22, 5342.17it/s]","\rparsing log, completed traces ::  21%|##        | 31552/150370 [00:04<00:20, 5663.21it/s]","\rparsing log, completed traces ::  21%|##1       | 32240/150370 [00:05<00:19, 5973.69it/s]","\rparsing log, completed traces ::  22%|##1       | 32914/150370 [00:05<00:19, 6178.10it/s]","\rparsing log, completed traces ::  22%|##2       | 33596/150370 [00:05<00:18, 6356.09it/s]","\rparsing log, completed traces ::  23%|##2       | 34274/150370 [00:05<00:17, 6476.00it/s]","\rparsing log, completed traces ::  23%|##3       | 34948/150370 [00:05<00:17, 6551.28it/s]","\rparsing log, completed traces ::  24%|##3       | 35627/150370 [00:05<00:17, 6620.53it/s]","\rparsing log, completed traces ::  24%|##4       | 36315/150370 [00:05<00:17, 6695.42it/s]","\rparsing log, completed traces ::  25%|##4       | 37011/150370 [00:05<00:16, 6772.57it/s]","\rparsing log, completed traces ::  25%|##5       | 37705/150370 [00:05<00:16, 6822.06it/s]","\rparsing log, completed traces ::  26%|##5       | 38422/150370 [00:05<00:16, 6925.15it/s]","\rparsing log, completed traces ::  26%|##6       | 39140/150370 [00:06<00:15, 7001.03it/s]","\rparsing log, completed traces ::  27%|##6       | 39872/150370 [00:06<00:15, 7095.51it/s]","\rparsing log, completed traces ::  27%|##6       | 40584/150370 [00:06<00:32, 3370.22it/s]","\rparsing log, completed traces ::  27%|##7       | 41324/150370 [00:06<00:26, 4049.58it/s]","\rparsing log, completed traces ::  28%|##7       | 42083/150370 [00:06<00:22, 4736.01it/s]","\rparsing log, completed traces ::  28%|##8       | 42823/150370 [00:06<00:20, 5314.31it/s]","\rparsing log, completed traces ::  29%|##8       | 43587/150370 [00:06<00:18, 5864.14it/s]","\rparsing log, completed traces ::  29%|##9       | 44329/150370 [00:07<00:16, 6256.54it/s]","\rparsing log, completed traces ::  30%|##9       | 45055/150370 [00:07<00:16, 6522.64it/s]","\rparsing log, completed traces ::  30%|###       | 45794/150370 [00:07<00:15, 6760.03it/s]","\rparsing log, completed traces ::  31%|###       | 46519/150370 [00:07<00:15, 6859.68it/s]","\rparsing log, completed traces ::  31%|###1      | 47240/150370 [00:07<00:14, 6889.89it/s]","\rparsing log, completed traces ::  32%|###1      | 47983/150370 [00:07<00:14, 7045.35it/s]","\rparsing log, completed traces ::  32%|###2      | 48759/150370 [00:07<00:14, 7240.60it/s]","\rparsing log, completed traces ::  33%|###2      | 49571/150370 [00:07<00:13, 7485.40it/s]","\rparsing log, completed traces ::  33%|###3      | 50329/150370 [00:07<00:13, 7488.42it/s]","\rparsing log, completed traces ::  34%|###3      | 51085/150370 [00:07<00:13, 7470.02it/s]","\rparsing log, completed traces ::  34%|###4      | 51837/150370 [00:08<00:13, 7454.63it/s]","\rparsing log, completed traces ::  35%|###4      | 52586/150370 [00:08<00:13, 7437.26it/s]","\rparsing log, completed traces ::  35%|###5      | 53332/150370 [00:08<00:13, 7401.79it/s]","\rparsing log, completed traces ::  36%|###5      | 54086/150370 [00:08<00:12, 7442.41it/s]","\rparsing log, completed traces ::  37%|###6      | 54901/150370 [00:08<00:12, 7636.58it/s]","\rparsing log, completed traces ::  37%|###7      | 55666/150370 [00:09<00:28, 3381.56it/s]","\rparsing log, completed traces ::  38%|###7      | 56471/150370 [00:09<00:22, 4121.10it/s]","\rparsing log, completed traces ::  38%|###8      | 57253/150370 [00:09<00:19, 4802.65it/s]","\rparsing log, completed traces ::  39%|###8      | 58018/150370 [00:09<00:17, 5395.87it/s]","\rparsing log, completed traces ::  39%|###9      | 58754/150370 [00:09<00:15, 5838.03it/s]","\rparsing log, completed traces ::  40%|###9      | 59484/150370 [00:09<00:14, 6198.41it/s]","\rparsing log, completed traces ::  40%|####      | 60233/150370 [00:09<00:13, 6533.63it/s]","\rparsing log, completed traces ::  41%|####      | 61042/150370 [00:09<00:12, 6947.01it/s]","\rparsing log, completed traces ::  41%|####1     | 61861/150370 [00:09<00:12, 7276.59it/s]","\rparsing log, completed traces ::  42%|####1     | 62644/150370 [00:09<00:11, 7415.07it/s]","\rparsing log, completed traces ::  42%|####2     | 63416/150370 [00:10<00:11, 7418.75it/s]","\rparsing log, completed traces ::  43%|####2     | 64180/150370 [00:10<00:11, 7425.81it/s]","\rparsing log, completed traces ::  43%|####3     | 64941/150370 [00:10<00:11, 7477.64it/s]","\rparsing log, completed traces ::  44%|####3     | 65734/150370 [00:10<00:11, 7588.59it/s]","\rparsing log, completed traces ::  44%|####4     | 66501/150370 [00:10<00:11, 7579.05it/s]","\rparsing log, completed traces ::  45%|####4     | 67294/150370 [00:10<00:10, 7676.90it/s]","\rparsing log, completed traces ::  45%|####5     | 68150/150370 [00:10<00:10, 7938.84it/s]","\rparsing log, completed traces ::  46%|####5     | 68947/150370 [00:10<00:10, 7912.54it/s]","\rparsing log, completed traces ::  46%|####6     | 69741/150370 [00:10<00:10, 7858.45it/s]","\rparsing log, completed traces ::  47%|####6     | 70529/150370 [00:10<00:10, 7852.02it/s]","\rparsing log, completed traces ::  47%|####7     | 71316/150370 [00:11<00:10, 7856.81it/s]","\rparsing log, completed traces ::  48%|####7     | 72103/150370 [00:11<00:10, 7801.97it/s]","\rparsing log, completed traces ::  48%|####8     | 72884/150370 [00:11<00:09, 7782.54it/s]","\rparsing log, completed traces ::  49%|####8     | 73663/150370 [00:11<00:10, 7585.31it/s]","\rparsing log, completed traces ::  49%|####9     | 74423/150370 [00:11<00:23, 3175.71it/s]","\rparsing log, completed traces ::  50%|#####     | 75277/150370 [00:12<00:18, 3974.55it/s]","\rparsing log, completed traces ::  51%|#####     | 76078/150370 [00:12<00:15, 4675.56it/s]","\rparsing log, completed traces ::  51%|#####1    | 76904/150370 [00:12<00:13, 5392.60it/s]","\rparsing log, completed traces ::  52%|#####1    | 77673/150370 [00:12<00:12, 5902.63it/s]","\rparsing log, completed traces ::  52%|#####2    | 78440/150370 [00:12<00:11, 6327.53it/s]","\rparsing log, completed traces ::  53%|#####2    | 79231/150370 [00:12<00:10, 6732.76it/s]","\rparsing log, completed traces ::  53%|#####3    | 80009/150370 [00:12<00:10, 7012.33it/s]","\rparsing log, completed traces ::  54%|#####3    | 80780/150370 [00:12<00:09, 7189.82it/s]","\rparsing log, completed traces ::  54%|#####4    | 81557/150370 [00:12<00:09, 7353.58it/s]","\rparsing log, completed traces ::  55%|#####4    | 82397/150370 [00:12<00:08, 7640.34it/s]","\rparsing log, completed traces ::  55%|#####5    | 83229/150370 [00:13<00:08, 7837.85it/s]","\rparsing log, completed traces ::  56%|#####5    | 84032/150370 [00:13<00:08, 7870.22it/s]","\rparsing log, completed traces ::  56%|#####6    | 84832/150370 [00:13<00:08, 7845.08it/s]","\rparsing log, completed traces ::  57%|#####6    | 85626/150370 [00:13<00:08, 7814.49it/s]","\rparsing log, completed traces ::  57%|#####7    | 86428/150370 [00:13<00:08, 7874.38it/s]","\rparsing log, completed traces ::  58%|#####8    | 87237/150370 [00:13<00:07, 7937.92it/s]","\rparsing log, completed traces ::  59%|#####8    | 88037/150370 [00:13<00:07, 7955.33it/s]","\rparsing log, completed traces ::  59%|#####9    | 88845/150370 [00:13<00:07, 7992.33it/s]","\rparsing log, completed traces ::  60%|#####9    | 89664/150370 [00:13<00:07, 8050.16it/s]","\rparsing log, completed traces ::  60%|######    | 90477/150370 [00:13<00:07, 8072.24it/s]","\rparsing log, completed traces ::  61%|######    | 91287/150370 [00:14<00:07, 8078.44it/s]","\rparsing log, completed traces ::  61%|######1   | 92096/150370 [00:14<00:07, 8078.95it/s]","\rparsing log, completed traces ::  62%|######1   | 92905/150370 [00:14<00:07, 8035.58it/s]","\rparsing log, completed traces ::  62%|######2   | 93709/150370 [00:14<00:07, 8032.41it/s]","\rparsing log, completed traces ::  63%|######2   | 94535/150370 [00:14<00:06, 8099.94it/s]","\rparsing log, completed traces ::  63%|######3   | 95346/150370 [00:15<00:17, 3060.83it/s]","\rparsing log, completed traces ::  64%|######3   | 96127/150370 [00:15<00:14, 3720.60it/s]","\rparsing log, completed traces ::  64%|######4   | 96902/150370 [00:15<00:12, 4387.40it/s]","\rparsing log, completed traces ::  65%|######4   | 97674/150370 [00:15<00:10, 5024.51it/s]","\rparsing log, completed traces ::  65%|######5   | 98472/150370 [00:15<00:09, 5658.70it/s]","\rparsing log, completed traces ::  66%|######6   | 99273/150370 [00:15<00:08, 6209.69it/s]","\rparsing log, completed traces ::  67%|######6   | 100054/150370 [00:15<00:07, 6595.86it/s]","\rparsing log, completed traces ::  67%|######7   | 100857/150370 [00:15<00:07, 6971.46it/s]","\rparsing log, completed traces ::  68%|######7   | 101666/150370 [00:15<00:06, 7275.53it/s]","\rparsing log, completed traces ::  68%|######8   | 102471/150370 [00:15<00:06, 7488.80it/s]","\rparsing log, completed traces ::  69%|######8   | 103262/150370 [00:16<00:06, 7596.07it/s]","\rparsing log, completed traces ::  69%|######9   | 104052/150370 [00:16<00:06, 7665.41it/s]","\rparsing log, completed traces ::  70%|######9   | 104840/150370 [00:16<00:05, 7674.89it/s]","\rparsing log, completed traces ::  70%|#######   | 105623/150370 [00:16<00:05, 7717.10it/s]","\rparsing log, completed traces ::  71%|#######   | 106406/150370 [00:16<00:05, 7722.85it/s]","\rparsing log, completed traces ::  71%|#######1  | 107186/150370 [00:16<00:05, 7716.03it/s]","\rparsing log, completed traces ::  72%|#######1  | 107963/150370 [00:16<00:05, 7708.26it/s]","\rparsing log, completed traces ::  72%|#######2  | 108738/150370 [00:16<00:05, 7701.96it/s]","\rparsing log, completed traces ::  73%|#######2  | 109514/150370 [00:16<00:05, 7718.91it/s]","\rparsing log, completed traces ::  73%|#######3  | 110288/150370 [00:16<00:05, 7632.46it/s]","\rparsing log, completed traces ::  74%|#######3  | 111077/150370 [00:17<00:05, 7706.97it/s]","\rparsing log, completed traces ::  74%|#######4  | 111862/150370 [00:17<00:04, 7749.37it/s]","\rparsing log, completed traces ::  75%|#######4  | 112638/150370 [00:17<00:04, 7646.52it/s]","\rparsing log, completed traces ::  75%|#######5  | 113404/150370 [00:17<00:04, 7648.86it/s]","\rparsing log, completed traces ::  76%|#######6  | 114343/150370 [00:17<00:04, 8163.98it/s]","\rparsing log, completed traces ::  77%|#######6  | 115287/150370 [00:17<00:04, 8543.77it/s]","\rparsing log, completed traces ::  77%|#######7  | 116211/150370 [00:17<00:03, 8750.35it/s]","\rparsing log, completed traces ::  78%|#######7  | 117286/150370 [00:17<00:03, 9346.57it/s]","\rparsing log, completed traces ::  79%|#######8  | 118222/150370 [00:17<00:03, 8676.30it/s]","\rparsing log, completed traces ::  79%|#######9  | 119100/150370 [00:18<00:10, 3029.43it/s]","\rparsing log, completed traces ::  80%|#######9  | 119819/150370 [00:18<00:08, 3543.76it/s]","\rparsing log, completed traces ::  80%|########  | 120548/150370 [00:18<00:07, 4106.18it/s]","\rparsing log, completed traces ::  81%|########  | 121267/150370 [00:18<00:06, 4649.61it/s]","\rparsing log, completed traces ::  81%|########1 | 121997/150370 [00:19<00:05, 5182.76it/s]","\rparsing log, completed traces ::  82%|########1 | 122735/150370 [00:19<00:04, 5672.17it/s]","\rparsing log, completed traces ::  82%|########2 | 123464/150370 [00:19<00:04, 6063.48it/s]","\rparsing log, completed traces ::  83%|########2 | 124184/150370 [00:19<00:04, 6336.99it/s]","\rparsing log, completed traces ::  83%|########3 | 124902/150370 [00:19<00:03, 6542.32it/s]","\rparsing log, completed traces ::  84%|########3 | 125639/150370 [00:19<00:03, 6770.60it/s]","\rparsing log, completed traces ::  84%|########4 | 126371/150370 [00:19<00:03, 6923.42it/s]","\rparsing log, completed traces ::  85%|########4 | 127130/150370 [00:19<00:03, 7107.83it/s]","\rparsing log, completed traces ::  85%|########5 | 127873/150370 [00:19<00:03, 7201.43it/s]","\rparsing log, completed traces ::  86%|########5 | 128625/150370 [00:19<00:02, 7289.86it/s]","\rparsing log, completed traces ::  86%|########6 | 129381/150370 [00:20<00:02, 7356.36it/s]","\rparsing log, completed traces ::  87%|########6 | 130131/150370 [00:20<00:02, 7383.98it/s]","\rparsing log, completed traces ::  87%|########7 | 130892/150370 [00:20<00:02, 7435.82it/s]","\rparsing log, completed traces ::  88%|########7 | 131669/150370 [00:20<00:02, 7535.20it/s]","\rparsing log, completed traces ::  88%|########8 | 132449/150370 [00:20<00:02, 7611.94it/s]","\rparsing log, completed traces ::  89%|########8 | 133300/150370 [00:20<00:02, 7879.42it/s]","\rparsing log, completed traces ::  89%|########9 | 134090/150370 [00:20<00:02, 7797.94it/s]","\rparsing log, completed traces ::  90%|########9 | 134872/150370 [00:20<00:02, 7746.45it/s]","\rparsing log, completed traces ::  90%|######### | 135648/150370 [00:20<00:01, 7652.96it/s]","\rparsing log, completed traces ::  91%|######### | 136415/150370 [00:21<00:01, 7565.93it/s]","\rparsing log, completed traces ::  91%|#########1| 137173/150370 [00:21<00:01, 7498.47it/s]","\rparsing log, completed traces ::  92%|#########1| 137924/150370 [00:21<00:01, 7453.64it/s]","\rparsing log, completed traces ::  92%|#########2| 138678/150370 [00:21<00:01, 7477.18it/s]","\rparsing log, completed traces ::  93%|#########2| 139428/150370 [00:21<00:01, 7482.93it/s]","\rparsing log, completed traces ::  93%|#########3| 140177/150370 [00:21<00:01, 7478.24it/s]","\rparsing log, completed traces ::  94%|#########3| 140964/150370 [00:21<00:01, 7592.62it/s]","\rparsing log, completed traces ::  94%|#########4| 141743/150370 [00:21<00:01, 7650.41it/s]","\rparsing log, completed traces ::  95%|#########4| 142509/150370 [00:21<00:01, 7644.57it/s]","\rparsing log, completed traces ::  95%|#########5| 143274/150370 [00:21<00:00, 7629.44it/s]","\rparsing log, completed traces ::  96%|#########5| 144042/150370 [00:22<00:00, 7637.04it/s]","\rparsing log, completed traces ::  96%|#########6| 144806/150370 [00:22<00:00, 7591.06it/s]","\rparsing log, completed traces ::  97%|#########6| 145566/150370 [00:22<00:02, 2355.48it/s]","\rparsing log, completed traces ::  97%|#########7| 146154/150370 [00:23<00:01, 2766.47it/s]","\rparsing log, completed traces ::  98%|#########7| 146772/150370 [00:23<00:01, 3253.93it/s]","\rparsing log, completed traces ::  98%|#########8| 147375/150370 [00:23<00:00, 3724.03it/s]","\rparsing log, completed traces ::  98%|#########8| 147976/150370 [00:23<00:00, 4163.40it/s]","\rparsing log, completed traces ::  99%|#########8| 148614/150370 [00:23<00:00, 4645.39it/s]","\rparsing log, completed traces ::  99%|#########9| 149281/150370 [00:23<00:00, 5125.30it/s]","\rparsing log, completed traces :: 100%|#########9| 149993/150370 [00:23<00:00, 5628.65it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:23<00:00, 6339.97it/s]","\n","[data] Loaded datasets: ['BPI2012', 'BPI2017', 'ROAD']","\n","\n=== Dataset: BPI2012 ===","\n","Samples train/val/test: 22252/4176/4196; vocab=23","\n","Epoch 1: validation_loss = 0.5594 | val_acc=0.7409 | val_f1=0.5316 | val_top3=0.9840","\n","Epoch 2: validation_loss = 0.5308 | val_acc=0.7598 | val_f1=0.5425 | val_top3=0.9854","\n","Epoch 3: validation_loss = 0.5333 | val_acc=0.7574 | val_f1=0.5725 | val_top3=0.9859","\n","Epoch 4: validation_loss = 0.5195 | val_acc=0.7629 | val_f1=0.5835 | val_top3=0.9861","\n","Epoch 5: validation_loss = 0.5221 | val_acc=0.7450 | val_f1=0.6007 | val_top3=0.9854","\n","Epoch 6: validation_loss = 0.5249 | val_acc=0.7634 | val_f1=0.5833 | val_top3=0.9861","\n","Epoch 7: validation_loss = 0.5073 | val_acc=0.7639 | val_f1=0.5909 | val_top3=0.9856","\n","Epoch 8: validation_loss = 0.5113 | val_acc=0.7593 | val_f1=0.5790 | val_top3=0.9859","\n","Epoch 9: validation_loss = 0.5105 | val_acc=0.7639 | val_f1=0.5842 | val_top3=0.9852","\n","Epoch 10: validation_loss = 0.5201 | val_acc=0.7634 | val_f1=0.5797 | val_top3=0.9847","\n","[BPI2012] Train: loss=0.5148 acc=0.7777 f1=0.5609 top3=0.9868","\n","[BPI2012] Test:  loss=0.5355 acc=0.7569 f1=0.5872 top3=0.9874","\n","\n=== Dataset: BPI2017 ===","\n","Samples train/val/test: 34519/7403/7374; vocab=24","\n","Epoch 1: validation_loss = 0.4172 | val_acc=0.8368 | val_f1=0.5299 | val_top3=0.9904","\n","Epoch 2: validation_loss = 0.4004 | val_acc=0.8367 | val_f1=0.5595 | val_top3=0.9907","\n","Epoch 3: validation_loss = 0.3864 | val_acc=0.8384 | val_f1=0.5719 | val_top3=0.9912","\n","Epoch 4: validation_loss = 0.3847 | val_acc=0.8395 | val_f1=0.5903 | val_top3=0.9919","\n","Epoch 5: validation_loss = 0.3812 | val_acc=0.8405 | val_f1=0.5856 | val_top3=0.9922","\n","Epoch 6: validation_loss = 0.3802 | val_acc=0.8376 | val_f1=0.5896 | val_top3=0.9916","\n","Epoch 7: validation_loss = 0.3769 | val_acc=0.8361 | val_f1=0.5957 | val_top3=0.9924","\n","Epoch 8: validation_loss = 0.3799 | val_acc=0.8386 | val_f1=0.6180 | val_top3=0.9927","\n","Epoch 9: validation_loss = 0.3805 | val_acc=0.8391 | val_f1=0.5989 | val_top3=0.9926","\n","Epoch 10: validation_loss = 0.3756 | val_acc=0.8399 | val_f1=0.6155 | val_top3=0.9928","\n","[BPI2017] Train: loss=0.3607 acc=0.8422 f1=0.5721 top3=0.9941","\n","[BPI2017] Test:  loss=0.3877 acc=0.8332 f1=0.5710 top3=0.9906","\n","\n=== Dataset: ROAD ===","\n","Samples train/val/test: 8707/1928/1869; vocab=11","\n","Epoch 1: validation_loss = 0.4913 | val_acc=0.7993 | val_f1=0.3684 | val_top3=0.9922","\n","Epoch 2: validation_loss = 0.4561 | val_acc=0.8086 | val_f1=0.4514 | val_top3=0.9948","\n","Epoch 3: validation_loss = 0.4566 | val_acc=0.8091 | val_f1=0.5300 | val_top3=0.9969","\n","Epoch 4: validation_loss = 0.4482 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 5: validation_loss = 0.4355 | val_acc=0.8112 | val_f1=0.6427 | val_top3=0.9969","\n","Epoch 6: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 7: validation_loss = 0.4328 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 8: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 9: validation_loss = 0.4274 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 10: validation_loss = 0.4329 | val_acc=0.8122 | val_f1=0.6664 | val_top3=0.9969","\n","[ROAD] Train: loss=0.4662 acc=0.7894 f1=0.5395 top3=0.9986","\n","[ROAD] Test:  loss=0.4833 acc=0.8020 f1=0.4740 top3=0.9936","\n","Execution time: 3 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the numpy file from the specified working directory, parse the nested experiment_data structure, and compute final or best metrics as requested. For training and test, I will report the final metrics saved in the structure. For validation, I will compute the best values across epochs for accuracy, F1 score, and top-3 accuracy, and the minimum validation loss using the recorded loss history. The script prints the dataset name followed by clearly labeled metrics and executes immediately.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef safe_get(d, *keys, default=None):\n    cur = d\n    for k in keys:\n        if isinstance(cur, dict) and k in cur:\n            cur = cur[k]\n        else:\n            return default\n    return cur\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.isfile(path):\n        raise FileNotFoundError(f\"File not found: {path}\")\n    data = np.load(path, allow_pickle=True).item()\n    if not isinstance(data, dict):\n        raise ValueError(\"Loaded experiment_data is not a dict.\")\n    return data\n\n\ndef extract_final_train_metrics(ds_data):\n    # Expect a 'final' entry\n    train_entries = safe_get(ds_data, \"metrics\", \"train\", default=[])\n    final = None\n    for tag, vals in train_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"train loss\"] = final.get(\"loss\", None)\n        out[\"train accuracy\"] = final.get(\"acc\", None)\n        out[\"train F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"train top-3 accuracy\"] = final.get(\"top3\", None)\n    else:\n        # Fallback: try last value from losses for loss only\n        train_losses = safe_get(ds_data, \"losses\", \"train\", default=[])\n        if train_losses:\n            out[\"train loss\"] = train_losses[-1][1]\n    return out\n\n\ndef extract_best_val_metrics(ds_data):\n    # Collect per-epoch validation metrics (acc, macro_f1, top3)\n    val_entries = safe_get(ds_data, \"metrics\", \"val\", default=[])\n    best = {\n        \"validation accuracy\": None,\n        \"validation F1 score\": None,\n        \"validation top-3 accuracy\": None,\n    }\n    for tag, vals in val_entries:\n        if isinstance(vals, dict):\n            acc = vals.get(\"acc\", None)\n            f1 = vals.get(\"macro_f1\", None)\n            top3 = vals.get(\"top3\", None)\n            if acc is not None:\n                best[\"validation accuracy\"] = (\n                    acc\n                    if best[\"validation accuracy\"] is None\n                    else max(best[\"validation accuracy\"], acc)\n                )\n            if f1 is not None:\n                best[\"validation F1 score\"] = (\n                    f1\n                    if best[\"validation F1 score\"] is None\n                    else max(best[\"validation F1 score\"], f1)\n                )\n            if top3 is not None:\n                best[\"validation top-3 accuracy\"] = (\n                    top3\n                    if best[\"validation top-3 accuracy\"] is None\n                    else max(best[\"validation top-3 accuracy\"], top3)\n                )\n    # For validation loss, use recorded losses per epoch and take the minimum\n    val_losses = safe_get(ds_data, \"losses\", \"val\", default=[])\n    if val_losses:\n        min_val_loss = min((v for (_, v) in val_losses), default=None)\n    else:\n        # fallback: check 'final' val entry if present\n        min_val_loss = None\n        for tag, vals in val_entries:\n            if tag == \"final\" and isinstance(vals, dict):\n                min_val_loss = vals.get(\"loss\", None)\n                break\n    out = {\"validation loss\": min_val_loss}\n    out.update(best)\n    return out\n\n\ndef extract_final_test_metrics(ds_data):\n    test_entries = safe_get(ds_data, \"metrics\", \"test\", default=[])\n    final = None\n    for tag, vals in test_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"test loss\"] = final.get(\"loss\", None)\n        out[\"test accuracy\"] = final.get(\"acc\", None)\n        out[\"test F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"test top-3 accuracy\"] = final.get(\"top3\", None)\n    return out\n\n\ndef format_print_metrics(dataset_name, metrics_dict):\n    print(dataset_name)\n    # Keep a consistent order for readability\n    ordered_keys = [\n        \"train loss\",\n        \"train accuracy\",\n        \"train F1 score\",\n        \"train top-3 accuracy\",\n        \"validation loss\",\n        \"validation accuracy\",\n        \"validation F1 score\",\n        \"validation top-3 accuracy\",\n        \"test loss\",\n        \"test accuracy\",\n        \"test F1 score\",\n        \"test top-3 accuracy\",\n    ]\n    printed_any = False\n    for k in ordered_keys:\n        if k in metrics_dict and metrics_dict[k] is not None:\n            val = metrics_dict[k]\n            if isinstance(val, float):\n                print(f\"{k}: {val:.4f}\")\n            else:\n                print(f\"{k}: {val}\")\n            printed_any = True\n    # Print any remaining keys that were not in the ordered list\n    for k, v in metrics_dict.items():\n        if k not in ordered_keys and v is not None:\n            if isinstance(v, float):\n                print(f\"{k}: {v:.4f}\")\n            else:\n                print(f\"{k}: {v}\")\n            printed_any = True\n    if not printed_any:\n        print(\"No metrics available\")\n\n\ndef run():\n    experiment_data = load_experiment_data()\n    for ds_name, ds_data in experiment_data.items():\n        all_metrics = {}\n        all_metrics.update(extract_final_train_metrics(ds_data))\n        all_metrics.update(extract_best_val_metrics(ds_data))\n        all_metrics.update(extract_final_test_metrics(ds_data))\n        format_print_metrics(ds_name, all_metrics)\n\n\n# Execute immediately\nrun()\n","parse_term_out":["BPI2012","\n","train loss: 0.5148","\n","train accuracy: 0.7777","\n","train F1 score: 0.5609","\n","train top-3 accuracy: 0.9868","\n","validation loss: 0.5073","\n","validation accuracy: 0.7639","\n","validation F1 score: 0.6007","\n","validation top-3 accuracy: 0.9861","\n","test loss: 0.5355","\n","test accuracy: 0.7569","\n","test F1 score: 0.5872","\n","test top-3 accuracy: 0.9874","\n","BPI2017","\n","train loss: 0.3607","\n","train accuracy: 0.8422","\n","train F1 score: 0.5721","\n","train top-3 accuracy: 0.9941","\n","validation loss: 0.3756","\n","validation accuracy: 0.8405","\n","validation F1 score: 0.6180","\n","validation top-3 accuracy: 0.9928","\n","test loss: 0.3877","\n","test accuracy: 0.8332","\n","test F1 score: 0.5710","\n","test top-3 accuracy: 0.9906","\n","ROAD","\n","train loss: 0.4662","\n","train accuracy: 0.7894","\n","train F1 score: 0.5395","\n","train top-3 accuracy: 0.9986","\n","validation loss: 0.4274","\n","validation accuracy: 0.8122","\n","validation F1 score: 0.6664","\n","validation top-3 accuracy: 0.9969","\n","test loss: 0.4833","\n","test accuracy: 0.8020","\n","test F1 score: 0.4740","\n","test top-3 accuracy: 0.9936","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":236.42285084724426,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"","exp_results_dir":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087","metric":{"value":{"metric_names":[{"metric_name":"loss","lower_is_better":true,"description":"Cross-entropy loss averaged over samples.","data":[{"dataset_name":"BPI2012 tr","final_value":0.5148,"best_value":0.5148},{"dataset_name":"BPI2012 dev","final_value":0.5073,"best_value":0.5073},{"dataset_name":"BPI2012 ts","final_value":0.5355,"best_value":0.5355},{"dataset_name":"BPI2017 tr","final_value":0.3607,"best_value":0.3607},{"dataset_name":"BPI2017 dev","final_value":0.3756,"best_value":0.3756},{"dataset_name":"BPI2017 ts","final_value":0.3877,"best_value":0.3877},{"dataset_name":"ROAD tr","final_value":0.4662,"best_value":0.4662},{"dataset_name":"ROAD dev","final_value":0.4274,"best_value":0.4274},{"dataset_name":"ROAD ts","final_value":0.4833,"best_value":0.4833}]},{"metric_name":"accuracy","lower_is_better":false,"description":"Top-1 classification accuracy.","data":[{"dataset_name":"BPI2012 tr","final_value":0.7777,"best_value":0.7777},{"dataset_name":"BPI2012 dev","final_value":0.7639,"best_value":0.7639},{"dataset_name":"BPI2012 ts","final_value":0.7569,"best_value":0.7569},{"dataset_name":"BPI2017 tr","final_value":0.8422,"best_value":0.8422},{"dataset_name":"BPI2017 dev","final_value":0.8405,"best_value":0.8405},{"dataset_name":"BPI2017 ts","final_value":0.8332,"best_value":0.8332},{"dataset_name":"ROAD tr","final_value":0.7894,"best_value":0.7894},{"dataset_name":"ROAD dev","final_value":0.8122,"best_value":0.8122},{"dataset_name":"ROAD ts","final_value":0.802,"best_value":0.802}]},{"metric_name":"F1 score","lower_is_better":false,"description":"Harmonic mean of precision and recall (macro/weighted not specified).","data":[{"dataset_name":"BPI2012 tr","final_value":0.5609,"best_value":0.5609},{"dataset_name":"BPI2012 dev","final_value":0.6007,"best_value":0.6007},{"dataset_name":"BPI2012 ts","final_value":0.5872,"best_value":0.5872},{"dataset_name":"BPI2017 tr","final_value":0.5721,"best_value":0.5721},{"dataset_name":"BPI2017 dev","final_value":0.618,"best_value":0.618},{"dataset_name":"BPI2017 ts","final_value":0.571,"best_value":0.571},{"dataset_name":"ROAD tr","final_value":0.5395,"best_value":0.5395},{"dataset_name":"ROAD dev","final_value":0.6664,"best_value":0.6664},{"dataset_name":"ROAD ts","final_value":0.474,"best_value":0.474}]},{"metric_name":"top-3 accuracy","lower_is_better":false,"description":"Fraction of samples where the correct label is among the top-3 predictions.","data":[{"dataset_name":"BPI2012 tr","final_value":0.9868,"best_value":0.9868},{"dataset_name":"BPI2012 dev","final_value":0.9861,"best_value":0.9861},{"dataset_name":"BPI2012 ts","final_value":0.9874,"best_value":0.9874},{"dataset_name":"BPI2017 tr","final_value":0.9941,"best_value":0.9941},{"dataset_name":"BPI2017 dev","final_value":0.9928,"best_value":0.9928},{"dataset_name":"BPI2017 ts","final_value":0.9906,"best_value":0.9906},{"dataset_name":"ROAD tr","final_value":0.9986,"best_value":0.9986},{"dataset_name":"ROAD dev","final_value":0.9969,"best_value":0.9969},{"dataset_name":"ROAD ts","final_value":0.9936,"best_value":0.9936}]}]},"maximize":null,"name":null,"description":null},"is_buggy":false,"is_buggy_plots":false,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":["../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2017.png","../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2012.png","../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_ROAD.png","../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2017.png","../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_ROAD.png","../../logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2012.png"],"plot_paths":["experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2017.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2012.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_ROAD.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2017.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_ROAD.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2012.png"],"plot_analyses":[{"analysis":"The validation top-3 accuracy for the BPI2017 dataset shows a consistent increase over the epochs, indicating that the model is effectively learning to predict the top-3 next activities over time. The accuracy surpasses 0.9925, which suggests strong predictive performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2017.png"},{"analysis":"The validation top-3 accuracy for the BPI2012 dataset starts strong, reaching above 0.9860 early in training, but shows a slight decline towards the end of the epochs. This could indicate overfitting or a plateau in learning efficiency, requiring potential adjustments in model complexity or training duration.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_BPI2012.png"},{"analysis":"The loss curves for the ROAD dataset show a clear and rapid decline in both training and validation loss. The validation loss stabilizes close to the training loss, indicating good generalization without significant overfitting. The model appears to be well-calibrated for this dataset.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_ROAD.png"},{"analysis":"The loss curves for the BPI2017 dataset demonstrate a sharp decline in both training and validation loss, with the validation loss closely following the training loss. This suggests effective learning and good model generalization with minimal overfitting.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2017.png"},{"analysis":"The validation top-3 accuracy for the ROAD dataset reaches a high value early on and remains stable throughout the epochs, indicating strong model performance and consistency in predicting the top-3 next activities. The accuracy remains nearly constant at around 0.997, reflecting excellent predictive capabilities.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/val_top3_ROAD.png"},{"analysis":"The loss curves for the BPI2012 dataset show a significant decrease in both training and validation loss with epochs, indicating effective learning. The validation loss is slightly higher than the training loss towards the end, suggesting minor overfitting that may be rectified with techniques such as dropout or regularization.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_726b2721d45c4800b9381c5d265fefcb_proc_332087/loss_curves_BPI2012.png"}],"vlm_feedback_summary":"The experimental results demonstrate strong predictive performance across different datasets, particularly in top-3 accuracy metrics. While the ROAD dataset shows excellent consistency and high accuracy, the BPI2012 dataset indicates potential overfitting concerns. Loss curves across datasets suggest good generalization capabilities, with minor overfitting observed in the BPI2012 dataset. Further refinement may be needed in model tuning and complexity to address these issues.","datasets_successfully_tested":["BPI2017","BPI2012","ROAD"],"ablation_name":null,"hyperparam_name":null,"is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score, confusion_matrix\nimport random\nimport math\nimport glob\nfrom datetime import datetime\n\n# pm4py for XES loading\ntry:\n    import pm4py\n    from pm4py.objects.log.importer.xes import importer as xes_importer\n    from pm4py.objects.conversion.log import converter as log_converter\nexcept Exception as e:\n    raise ImportError(\n        \"pm4py is required to load XES files. Please install pm4py.\"\n    ) from e\n\n# Working directory\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure (per instructions)\nexperiment_data = {\n    \"max_epochs_tuning\": {\n        # dataset_name: to be filled dynamically\n    }\n}\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Load XES datasets using pm4py from local directory \"data\"\ndef load_xes_datasets(data_dir=\"data\"):\n    datasets = {}\n    os.makedirs(data_dir, exist_ok=True)\n    xes_files = glob.glob(os.path.join(data_dir, \"*.xes\")) + glob.glob(\n        os.path.join(data_dir, \"*.xes.gz\")\n    )\n    if len(xes_files) == 0:\n        print(\n            f\"[warn] No XES files found in {data_dir}. Please place .xes or .xes.gz files there.\"\n        )\n        return datasets\n    for path in xes_files:\n        try:\n            log = xes_importer.apply(path)\n            df = pm4py.convert_to_dataframe(log)\n            # Standardize columns\n            # Common pm4py columns: case:concept:name, concept:name, time:timestamp, lifecycle:transition\n            if \"case:concept:name\" in df.columns:\n                df[\"case_id\"] = df[\"case:concept:name\"].astype(str)\n            elif \"case_id\" in df.columns:\n                df[\"case_id\"] = df[\"case_id\"].astype(str)\n            else:\n                # fallback - ensure a case grouping exists\n                df[\"case_id\"] = df.groupby(level=0).ngroup().astype(str)\n\n            if \"concept:name\" in df.columns:\n                df[\"activity\"] = df[\"concept:name\"].astype(str)\n            elif \"activity\" in df.columns:\n                df[\"activity\"] = df[\"activity\"].astype(str)\n            else:\n                # if missing, synthesize from event index\n                df[\"activity\"] = \"ACT\"\n\n            if \"time:timestamp\" in df.columns:\n                df[\"timestamp\"] = pd.to_datetime(df[\"time:timestamp\"], utc=True)\n            elif \"timestamp\" in df.columns:\n                df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True)\n            else:\n                # fabricate timestamps if missing (not ideal)\n                df[\"timestamp\"] = pd.to_datetime(datetime.utcnow())\n\n            if \"lifecycle:transition\" in df.columns:\n                df[\"lifecycle\"] = df[\"lifecycle:transition\"].astype(str)\n            elif \"lifecycle\" in df.columns:\n                df[\"lifecycle\"] = df[\"lifecycle\"].astype(str)\n            # Keep only necessary columns\n            df_std = df[\n                [\"case_id\", \"activity\", \"timestamp\"]\n                + ([\"lifecycle\"] if \"lifecycle\" in df.columns else [])\n            ].copy()\n            name = os.path.splitext(os.path.basename(path))[0]\n            datasets[name] = df_std\n            print(\n                f\"Loaded {name}: {len(df_std)} events, {df_std['case_id'].nunique()} cases\"\n            )\n        except Exception as e:\n            print(f\"[warn] Failed to load {path}: {e}\")\n    return datasets\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"].astype(str))\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"].astype(str))\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"].astype(str))\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_with_epoch_tuning(\n    name,\n    df,\n    base_epochs=30,\n    maybe_extend_to=50,\n    batch_size=128,\n    max_prefix_len=10,\n    lr=1e-3,\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples and vocab\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter splits\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return None\n\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training with early stopping and potential extension\n    best_val_top3 = -1.0\n    best_state = None\n    best_epoch = 0\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    patience = 8\n    no_improve = 0\n\n    def train_epochs(n_epochs, start_epoch_idx=0):\n        nonlocal best_val_top3, best_state, best_epoch, no_improve\n        for e in range(1, n_epochs + 1):\n            epoch = start_epoch_idx + e\n            model.train()\n            total = 0\n            running_loss = 0.0\n            for batch in dl_train:\n                batch = {\n                    k: v.to(device)\n                    for k, v in batch.items()\n                    if isinstance(v, torch.Tensor)\n                }\n                optimizer.zero_grad()\n                logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n                loss = criterion(logits, batch[\"y\"])\n                loss.backward()\n                optimizer.step()\n                running_loss += loss.item() * logits.size(0)\n                total += logits.size(0)\n            train_loss = running_loss / max(1, total)\n            val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n                model, dl_val, criterion, device, len(act2id), pad_id\n            )\n            print(\n                f\"Epoch {epoch}: val_loss={val_loss:.4f} | val_acc={val_acc:.4f} | val_f1={val_f1:.4f} | val_top3={val_top3:.4f}\"\n            )\n            hist[\"train_loss\"].append(train_loss)\n            hist[\"val_loss\"].append(val_loss)\n            hist[\"val_top3\"].append(val_top3)\n            if val_top3 > best_val_top3 + 1e-6:\n                best_val_top3 = val_top3\n                best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n                best_epoch = epoch\n                no_improve = 0\n            else:\n                no_improve += 1\n            # Early stopping within phase\n            if no_improve >= patience:\n                print(f\"Early stopping (no improvement in {patience} epochs).\")\n                break\n        return start_epoch_idx + len(hist[\"train_loss\"])\n\n    # Phase 1: up to base_epochs\n    last_epoch = train_epochs(base_epochs, start_epoch_idx=0)\n\n    # Decide whether to extend to maybe_extend_to\n    def should_extend(val_top3_hist, base_epochs):\n        if len(val_top3_hist) < 10:\n            return False\n        # If best near the end and upward trend over last 5 epochs\n        last5 = val_top3_hist[-5:]\n        prev5 = val_top3_hist[-10:-5]\n        if len(prev5) < 5:\n            return False\n        mean_gain = np.mean(last5) - np.mean(prev5)\n        condition = (best_epoch >= max(1, base_epochs - 3)) and (mean_gain > 0.002)\n        return condition\n\n    if should_extend(hist[\"val_top3\"], base_epochs) and maybe_extend_to > base_epochs:\n        print(\n            f\"Extending training to {maybe_extend_to} epochs due to improving validation top-3.\"\n        )\n        # Restore best before continuing to ensure good starting point\n        if best_state is not None:\n            model.load_state_dict(best_state)\n            model.to(device)\n        # Reset patience counter for extension\n        no_improve = 0\n        extra_epochs = maybe_extend_to - len(hist[\"train_loss\"])\n        if extra_epochs > 0:\n            last_epoch = train_epochs(\n                extra_epochs, start_epoch_idx=len(hist[\"train_loss\"])\n            )\n\n    # Load best checkpoint\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final evaluations\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Prepare results dict for this dataset\n    results = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": train_loss,\n                        \"acc\": train_acc,\n                        \"macro_f1\": train_f1,\n                        \"top3\": train_top3,\n                    },\n                )\n            ],\n            \"val\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": val_loss,\n                        \"acc\": val_acc,\n                        \"macro_f1\": val_f1,\n                        \"top3\": val_top3,\n                    },\n                )\n            ],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": test_loss,\n                        \"acc\": test_acc,\n                        \"macro_f1\": test_f1,\n                        \"top3\": test_top3,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(hist[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(hist[\"val_loss\"], start=1)),\n        },\n        \"val_top3_curve\": list(enumerate(hist[\"val_top3\"], start=1)),\n        \"predictions\": y_pred_t.tolist(),\n        \"ground_truth\": y_true_t.tolist(),\n        \"epochs_trained\": len(hist[\"train_loss\"]),\n        \"best_val_top3\": best_val_top3,\n        \"best_epoch\": best_epoch,\n        \"vocab_size\": len(act2id),\n        \"pad_idx\": pad_id,\n    }\n\n    # Save plottable data as numpy arrays\n    np.save(\n        os.path.join(working_dir, f\"{name}_train_loss.npy\"),\n        np.array(hist[\"train_loss\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_loss.npy\"),\n        np.array(hist[\"val_loss\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_top3.npy\"),\n        np.array(hist[\"val_top3\"], dtype=np.float32),\n    )\n    np.save(os.path.join(working_dir, f\"{name}_y_true.npy\"), y_true_t.astype(np.int64))\n    np.save(os.path.join(working_dir, f\"{name}_y_pred.npy\"), y_pred_t.astype(np.int64))\n    try:\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"{name}_confusion_matrix.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n\n    return results\n\n\ndef main():\n    datasets = load_xes_datasets(data_dir=\"data\")\n    # If no datasets found, exit gracefully after saving empty experiment_data\n    if len(datasets) == 0:\n        np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n        print(\"No datasets found. Exiting.\")\n        return\n    # Train each dataset (cap earliest 5000 cases for speed)\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        res = train_with_epoch_tuning(\n            key,\n            df_small,\n            base_epochs=30,\n            maybe_extend_to=50,\n            batch_size=128,\n            max_prefix_len=10,\n            lr=1e-3,\n        )\n        if res is not None:\n            experiment_data[\"max_epochs_tuning\"][key] = res\n\n    # Save consolidated experiment data (use mandated filename)\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n\n\n# Execute\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: max_epochs.\nPlan: Replace dataset loader with a pm4py-based XES loader that scans a local data folder for event logs and converts them to standardized dataframes. Implement LSTM training as in the baseline but add hyperparameter tuning for max_epochs: train up to 30 epochs with early stopping; if validation top-3 still trends up near epoch 30, continue to 50. Track best validation top-3 and restore best checkpoint. Save all plottable data (loss curves, val top-3, predictions, ground truth, confusion matrices) as NumPy arrays and consolidate experiment metadata in experiment_data.npy under a hyperparameter-tuning-specific namespace.","overall_plan":"","plot_code":null,"plot_plan":null,"step":1,"id":"95afc8fd95764ce68e602a1cb05b0950","ctime":1757758837.6909113,"_term_out":["Using device: cuda","\n","Execution time: a second seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1.3723392486572266,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"Run produced no meaningful results. The only output was the device print, indicating that dataset loading and training did not execute. Primary root cause: the script searches for XES files under ./data, but per the workspace and helper module conventions, logs are located under ./input. As a result, no datasets were found and the script exited early. Additional issues: (1) mild leakage risk by constructing the activity vocabulary on the full dataset before the time-based split; better to build vocab on train only and map OOV to UNK. (2) The current run did not meet stage goals: it did not evaluate on BPI 2017 and Road_Traffic_Fine_Management_Process, and it did not report required per-log metrics due to data-loading failure. Proposed fixes: (A) Replace load_xes_datasets with the robust loader from ai_scientist/ideas/my_research_topic.py, e.g., from my_research_topic import load_datasets, pick_default_dataset, or at minimum change discovery to prefer ./input and use the provided _resolve_data_dir() logic; support both .xes and .xes.gz. (B) Ensure informative logging when no datasets are found (print discovered directories and available files). (C) Build act2id from train set only, add an UNK token for unseen test activities. (D) After fixing data discovery, explicitly filter lifecycle=\\\"complete\\\" and keep time-based split as implemented. (E) Verify that the script iterates per recognized dataset names (BPI2012, BPI2017, ROAD) and reports next-activity metrics: accuracy, macro-F1, top-3 for each. After these changes, rerun to produce per-log metrics and satisfy the baseline_tuning stage requirements.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"max_epochs","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport sys\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport warnings\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n# Experiment data structure as required\nexperiment_data = {\n    \"lr_tuning\": {\n        # dataset_name: {\n        #   'per_lr': { '0.001': {...}, ... },\n        #   'best_lr': None,\n        #   'best_run': {},\n        # }\n    }\n}\n\n# Try to import pm4py (required)\ntry:\n    import pm4py\nexcept Exception as e:\n    print(\"Error: pm4py is required to load XES files. Please install pm4py.\")\n    pm4py = None\n\n\ndef discover_xes_files(root_dirs):\n    xes_files = []\n    for rd in root_dirs:\n        if not os.path.isdir(rd):\n            continue\n        for root, dirs, files in os.walk(rd):\n            for f in files:\n                if f.lower().endswith(\".xes\") or f.lower().endswith(\".xes.gz\"):\n                    xes_files.append(os.path.join(root, f))\n    # Remove duplicates while preserving order\n    uniq = []\n    seen = set()\n    for p in xes_files:\n        if p not in seen:\n            uniq.append(p)\n            seen.add(p)\n    return uniq\n\n\ndef load_xes_datasets():\n    \"\"\"\n    Load all XES logs found in ./data and current working dir recursively.\n    Convert to unified pandas DataFrame with columns: case_id, activity, timestamp, lifecycle (optional).\n    Returns dict: {dataset_name: df}\n    \"\"\"\n    datasets = {}\n    if pm4py is None:\n        return datasets\n    candidates = discover_xes_files([os.path.join(os.getcwd(), \"data\"), os.getcwd()])\n    if len(candidates) == 0:\n        print(\"No XES files found under ./data or current directory.\")\n    for path in candidates:\n        try:\n            print(f\"Loading XES: {path}\")\n            log = pm4py.read_xes(path)\n            df = pm4py.convert_to_dataframe(log)\n            # Map columns\n            col_map = {}\n            # Case id\n            if \"case:concept:name\" in df.columns:\n                col_map[\"case_id\"] = df[\"case:concept:name\"].astype(str)\n            elif \"case\" in df.columns:\n                col_map[\"case_id\"] = df[\"case\"].astype(str)\n            else:\n                # fallback: group by trace id index if exists\n                if \"trace_id\" in df.columns:\n                    col_map[\"case_id\"] = df[\"trace_id\"].astype(str)\n                else:\n                    # create synthetic\n                    col_map[\"case_id\"] = df.groupby(level=0).cumcount().astype(str)\n            # Activity\n            if \"concept:name\" in df.columns:\n                col_map[\"activity\"] = df[\"concept:name\"].astype(str)\n            elif \"activity\" in df.columns:\n                col_map[\"activity\"] = df[\"activity\"].astype(str)\n            else:\n                # cannot proceed if no activity name\n                print(f\"[warn] No activity column found for {path}, skipping.\")\n                continue\n            # Timestamp\n            if \"time:timestamp\" in df.columns:\n                ts = pd.to_datetime(df[\"time:timestamp\"], utc=True, errors=\"coerce\")\n            elif \"timestamp\" in df.columns:\n                ts = pd.to_datetime(df[\"timestamp\"], utc=True, errors=\"coerce\")\n            else:\n                print(f\"[warn] No timestamp column found for {path}, skipping.\")\n                continue\n            col_map[\"timestamp\"] = ts\n            # Lifecycle (optional)\n            if \"lifecycle:transition\" in df.columns:\n                col_map[\"lifecycle\"] = df[\"lifecycle:transition\"].astype(str)\n            elif \"lifecycle\" in df.columns:\n                col_map[\"lifecycle\"] = df[\"lifecycle\"].astype(str)\n            out = pd.DataFrame(col_map).dropna(subset=[\"timestamp\"])\n            out = out.sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n            name = os.path.splitext(os.path.basename(path))[0]\n            datasets[name] = out\n        except Exception as e:\n            print(f\"[warn] Failed to load {path}: {e}\")\n    return datasets\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if mask.any():\n            df = df[mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    # Initial normalization (will recompute on train split later)\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_one_run(name, df, max_epochs=12, batch_size=128, max_prefix_len=10, lr=1e-3):\n    # Time split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Prefix samples\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Re-normalize with train stats\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n\n    if len(samples_train) == 0 or len(act2id) < 2:\n        return None  # not enough data\n\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model, loss, optimizer\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    best_val_top3 = -1.0\n    best_state = None\n    history = {\n        \"epochs\": [],\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_top3\": [],\n    }\n\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n\n        history[\"epochs\"].append(epoch)\n        history[\"train_loss\"].append(train_loss)\n        history[\"val_loss\"].append(val_loss)\n        history[\"val_acc\"].append(val_acc)\n        history[\"val_f1\"].append(val_f1)\n        history[\"val_top3\"].append(val_top3)\n\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n\n    # Restore best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final evaluation\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n\n    run_summary = {\n        \"vocab_size\": len(act2id),\n        \"pad_id\": pad_id,\n        \"num_train_samples\": len(samples_train),\n        \"num_val_samples\": len(samples_val),\n        \"num_test_samples\": len(samples_test),\n        \"history\": history,\n        \"best_epoch\": int(\n            np.argmax(history[\"val_top3\"]) + 1 if len(history[\"val_top3\"]) > 0 else -1\n        ),\n        \"best_val_top3\": float(best_val_top3),\n        \"final_metrics\": {\n            \"train\": {\n                \"loss\": float(train_loss),\n                \"acc\": float(train_acc),\n                \"macro_f1\": float(train_f1),\n                \"top3\": float(train_top3),\n            },\n            \"val\": {\n                \"loss\": float(val_loss),\n                \"acc\": float(val_acc),\n                \"macro_f1\": float(val_f1),\n                \"top3\": float(val_top3),\n            },\n            \"test\": {\n                \"loss\": float(test_loss),\n                \"acc\": float(test_acc),\n                \"macro_f1\": float(test_f1),\n                \"top3\": float(test_top3),\n            },\n        },\n        \"predictions\": np.array(y_pred_t, dtype=np.int64),\n        \"ground_truth\": np.array(y_true_t, dtype=np.int64),\n        \"probs\": probs_t.astype(np.float32),\n    }\n    return run_summary\n\n\ndef main():\n    datasets = load_xes_datasets()\n    if len(datasets) == 0:\n        print(\"No datasets loaded. Exiting.\")\n        # Save empty structure to comply with requirement\n        np.save(\"experiment_data.npy\", experiment_data, allow_pickle=True)\n        return\n\n    lr_grid = [3e-4, 5e-4, 1e-3, 2e-3]\n    max_epochs = 12\n    batch_size = 128\n    max_prefix_len = 10\n\n    for ds_name, df in datasets.items():\n        print(f\"\\n=== Dataset: {ds_name} ===\")\n        # Cap to 5000 earliest cases for speed (optional, as in baseline)\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n\n        experiment_data[\"lr_tuning\"].setdefault(ds_name, {})\n        experiment_data[\"lr_tuning\"][ds_name][\"per_lr\"] = {}\n        best_lr = None\n        best_val_top3 = -1.0\n        best_run = None\n\n        for lr in lr_grid:\n            print(f\"Training with lr={lr}\")\n            run = train_one_run(\n                ds_name,\n                df_small,\n                max_epochs=max_epochs,\n                batch_size=batch_size,\n                max_prefix_len=max_prefix_len,\n                lr=lr,\n            )\n            if run is None:\n                print(\n                    \"Not enough data to train for this dataset. Skipping remaining LRs.\"\n                )\n                break\n            # Store run data\n            lr_key = f\"{lr:.4g}\"\n            experiment_data[\"lr_tuning\"][ds_name][\"per_lr\"][lr_key] = {\n                \"metrics\": {\n                    \"train\": [run[\"final_metrics\"][\"train\"]],\n                    \"val\": [run[\"final_metrics\"][\"val\"]],\n                    \"test\": [run[\"final_metrics\"][\"test\"]],\n                },\n                \"losses\": {\n                    \"train\": list(\n                        zip(run[\"history\"][\"epochs\"], run[\"history\"][\"train_loss\"])\n                    ),\n                    \"val\": list(\n                        zip(run[\"history\"][\"epochs\"], run[\"history\"][\"val_loss\"])\n                    ),\n                },\n                \"val_top3_curve\": list(\n                    zip(run[\"history\"][\"epochs\"], run[\"history\"][\"val_top3\"])\n                ),\n                \"val_acc_curve\": list(\n                    zip(run[\"history\"][\"epochs\"], run[\"history\"][\"val_acc\"])\n                ),\n                \"val_f1_curve\": list(\n                    zip(run[\"history\"][\"epochs\"], run[\"history\"][\"val_f1\"])\n                ),\n                \"predictions\": run[\"predictions\"],\n                \"ground_truth\": run[\"ground_truth\"],\n                \"best_epoch\": run[\"best_epoch\"],\n                \"best_val_top3\": run[\"best_val_top3\"],\n                \"num_train_samples\": run[\"num_train_samples\"],\n                \"num_val_samples\": run[\"num_val_samples\"],\n                \"num_test_samples\": run[\"num_test_samples\"],\n                \"vocab_size\": run[\"vocab_size\"],\n            }\n            # Select best by validation top-3\n            if run[\"best_val_top3\"] > best_val_top3:\n                best_val_top3 = run[\"best_val_top3\"]\n                best_lr = lr\n                best_run = run\n\n        experiment_data[\"lr_tuning\"][ds_name][\"best_lr\"] = best_lr\n        experiment_data[\"lr_tuning\"][ds_name][\"best_run\"] = {\n            \"best_val_top3\": float(best_val_top3),\n            \"lr\": best_lr,\n            \"history\": best_run[\"history\"] if best_run is not None else {},\n            \"final_metrics\": best_run[\"final_metrics\"] if best_run is not None else {},\n            \"predictions\": (\n                best_run[\"predictions\"]\n                if best_run is not None\n                else np.array([], dtype=np.int64)\n            ),\n            \"ground_truth\": (\n                best_run[\"ground_truth\"]\n                if best_run is not None\n                else np.array([], dtype=np.int64)\n            ),\n        }\n        print(\n            f\"Selected best lr for {ds_name}: {best_lr} with val_top3={best_val_top3:.4f}\"\n        )\n\n    # Save all experiment data once as a numpy file (as required)\n    np.save(\"experiment_data.npy\", experiment_data, allow_pickle=True)\n    print(\"Saved results to experiment_data.npy\")\n\n\n# Execute\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: learning rate (lr).\nI will implement a learning-rate grid search over {3e-4, 5e-4, 1e-3, 2e-3} while keeping other settings fixed, selecting the model by best validation top-3 accuracy. The script loads local XES logs using pm4py, builds time-based splits, trains an LSTM baseline, and evaluates top-1, top-3, and macro-F1. For each dataset and LR, it stores per-epoch losses and metrics, best checkpoints, predictions, and ground truth, and finally selects and reports the best LR. All plottable data and results are stored inside a single experiment_data structure and saved to experiment_data.npy.","overall_plan":"","plot_code":null,"plot_plan":null,"step":2,"id":"adda9b403f3744f1aa79ef815a1e80c9","ctime":1757758759.2632227,"_term_out":["Using device: cuda","\n","Execution time: a second seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1.4832112789154053,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The run appears to have failed to execute the intended experiments. The only output was 'Using device: cuda' and a generic execution time line; none of the expected dataset discovery/loading, training, or evaluation logs appeared. Root causes and fixes:\n\n1) Data discovery path bug: The script only searches ./data and CWD for XES files, ignoring the mandated ./input directory. Fix: either import and use ai_scientist/ideas/my_research_topic.load_datasets() (which robustly discovers input/*.xes) or extend discover_xes_files to include ./input and its parents.\n\n2) Likely no-dataset early exit: When no datasets are found, the script prints 'No datasets loaded. Exiting.' and quits after saving an empty npy. This matches the minimal output. Fix: ensure correct input path and presence of required logs (BPI 2017 and Road_Traffic_Fine_Management_Process) under input/ so the run proceeds.\n\n3) Requirement mismatch: The stage requires evaluation on BPI 2017 and Road datasets with time-based splits and reporting acc/F1/top-3 per log. The current code would do this only if datasets load; as run, it produced no metrics. Fix: after fixing data loading, verify per-log metrics are printed and saved; explicitly filter/select those two datasets by name.\n\n4) Minor API robustness: pm4py.read_xes/convert_to_dataframe may vary by version. To avoid import/runtime issues, use pm4py.objects.log.importer.xes.importer.apply and pm4py.convert_to_dataframe as in the provided loader.\n\n5) Compliance: The code should rely on the provided loader module to avoid duplication and ensure correct lifecycle/resource handling per constraints.\n\nAfter these fixes, rerun to generate per-log metrics and save experiment_data.npy with populated results.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"learning rate (lr)","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nfrom datetime import datetime\nfrom typing import Dict, List, Tuple\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Working dir\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\n# Experiment data per instruction\nexperiment_data = {\n    \"hyperparam_tuning_type_1\": {\n        # Will be filled as:\n        # dataset_name: {\n        #   'batch_size_64': {...},\n        #   'batch_size_128': {...},\n        #   'batch_size_256': {...},\n        #   'best': {'batch_size': 128, 'val_top3': 0.72, ...}\n        # }\n    }\n}\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# pm4py loading\ndef try_import_pm4py():\n    try:\n        import pm4py  # noqa\n\n        return True\n    except Exception as e:\n        print(f\"[warn] pm4py not available: {e}\")\n        return False\n\n\ndef load_xes_to_df(path: str) -> pd.DataFrame:\n    from pm4py.objects.log.importer.xes import importer as xes_importer\n    from pm4py.objects.conversion.log import converter as log_converter\n\n    log = xes_importer.apply(path)\n    df = log_converter.apply(log, variant=log_converter.Variants.TO_DATA_FRAME)\n    # Standardize columns\n    # Expecting 'case:concept:name', 'concept:name', 'time:timestamp', 'lifecycle:transition' (optional)\n    if (\n        \"case:concept:name\" not in df.columns\n        or \"concept:name\" not in df.columns\n        or \"time:timestamp\" not in df.columns\n    ):\n        raise ValueError(\"Unexpected XES columns\")\n    out = pd.DataFrame()\n    out[\"case_id\"] = df[\"case:concept:name\"].astype(str)\n    out[\"activity\"] = df[\"concept:name\"].astype(str)\n    out[\"timestamp\"] = pd.to_datetime(df[\"time:timestamp\"], utc=True)\n    if \"lifecycle:transition\" in df.columns:\n        out[\"lifecycle\"] = df[\"lifecycle:transition\"].astype(str)\n    else:\n        out[\"lifecycle\"] = \"complete\"\n    return out.sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n\n\ndef discover_xes_files(search_dirs: List[str]) -> Dict[str, str]:\n    # Map friendly names to files if found\n    candidates = {\n        \"BPI2012\": [\"BPI_Challenge_2012.xes\", \"BPI2012.xes\", \"bpi2012.xes\"],\n        \"BPI2017\": [\"BPI_Challenge_2017.xes\", \"BPI2017.xes\", \"bpi2017.xes\"],\n        \"ROAD\": [\"road_traffic_fines.xes\", \"Road_Traffic_Fines.xes\", \"road.xes\"],\n    }\n    found = {}\n    for d in search_dirs:\n        if not os.path.isdir(d):\n            continue\n        for root, _, files in os.walk(d):\n            lower = {f.lower(): f for f in files}\n            for key, names in candidates.items():\n                for nm in names:\n                    if nm.lower() in lower and key not in found:\n                        found[key] = os.path.join(root, lower[nm.lower()])\n    return found\n\n\ndef load_datasets_pm4py() -> Dict[str, pd.DataFrame]:\n    ds = {}\n    has_pm4py = try_import_pm4py()\n    if not has_pm4py:\n        return ds\n    paths = discover_xes_files([os.getcwd(), os.path.join(os.getcwd(), \"data\")])\n    for name, p in paths.items():\n        try:\n            df = load_xes_to_df(p)\n            ds[name] = df\n            print(f\"Loaded {name} from {p} with {len(df)} events\")\n        except Exception as e:\n            print(f\"[warn] Failed loading {name} from {p}: {e}\")\n    return ds\n\n\n# Synthetic fallback if no XES\ndef make_synthetic_df(n_cases=200, max_events=12, seed=42) -> pd.DataFrame:\n    rng = np.random.default_rng(seed)\n    activities = [\"A\", \"B\", \"C\", \"D\", \"E\", \"F\"]\n    rows = []\n    base_time = int(pd.Timestamp(\"2020-01-01\", tz=\"UTC\").value // 10**9)\n    for c in range(n_cases):\n        T = rng.integers(3, max_events)\n        start = base_time + int(rng.integers(0, 60 * 60 * 24 * 30))\n        ts = np.cumsum(rng.integers(10, 1000, size=T)) + start\n        for t in ts:\n            rows.append(\n                {\n                    \"case_id\": f\"C{c:05d}\",\n                    \"activity\": str(rng.choice(activities)),\n                    \"timestamp\": pd.to_datetime(t, unit=\"s\", utc=True),\n                    \"lifecycle\": \"complete\",\n                }\n            )\n    df = pd.DataFrame(rows).sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time split\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_eval_one_setting(\n    name, df, batch_size=128, max_epochs=10, max_prefix_len=10, lr=1e-3, cap_cases=5000\n):\n    # Optionally cap cases for speed\n    try:\n        starts = (\n            df.sort_values(\"timestamp\")\n            .groupby(\"case_id\")[\"timestamp\"]\n            .min()\n            .reset_index()\n        )\n        if len(starts) > cap_cases:\n            keep_cases = set(starts.iloc[:cap_cases][\"case_id\"])\n            df = df[df[\"case_id\"].isin(keep_cases)].copy()\n    except Exception:\n        pass\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train for this setting. Skipping.\")\n        return None\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"[bs={batch_size}] Epoch {epoch}: val_loss={val_loss:.4f} val_acc={val_acc:.4f} val_f1={val_f1:.4f} val_top3={val_top3:.4f}\"\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n\n    # Load best and evaluate\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n\n    results = {\n        \"settings\": {\n            \"batch_size\": batch_size,\n            \"max_epochs\": max_epochs,\n            \"max_prefix_len\": max_prefix_len,\n            \"lr\": lr,\n            \"vocab_size\": len(act2id),\n        },\n        \"losses\": {\n            \"train\": [(i + 1, float(x)) for i, x in enumerate(hist[\"train_loss\"])],\n            \"val\": [(i + 1, float(x)) for i, x in enumerate(hist[\"val_loss\"])],\n        },\n        \"metrics\": {\n            \"val_top3_curve\": [\n                (i + 1, float(x)) for i, x in enumerate(hist[\"val_top3\"])\n            ],\n            \"train_final\": {\n                \"loss\": float(train_loss),\n                \"acc\": float(train_acc),\n                \"macro_f1\": float(train_f1),\n                \"top3\": float(train_top3),\n            },\n            \"val_final\": {\n                \"loss\": float(val_loss),\n                \"acc\": float(val_acc),\n                \"macro_f1\": float(val_f1),\n                \"top3\": float(val_top3),\n            },\n            \"test_final\": {\n                \"loss\": float(test_loss),\n                \"acc\": float(test_acc),\n                \"macro_f1\": float(test_f1),\n                \"top3\": float(test_top3),\n            },\n        },\n        \"predictions\": np.array(y_pred_t, dtype=np.int64),\n        \"ground_truth\": np.array(y_true_t, dtype=np.int64),\n        \"probs\": probs_t,  # ndarray\n        \"pad_idx\": int(pad_id),\n        \"act2id\": act2id,\n    }\n    return results\n\n\ndef main():\n    # Load datasets using pm4py, fallback to synthetic if none found\n    datasets = load_datasets_pm4py()\n    if len(datasets) == 0:\n        print(\"[info] No XES datasets found. Using synthetic dataset as fallback.\")\n        datasets = {\"SYNTH\": make_synthetic_df(n_cases=500, max_events=15)}\n    # Hyperparameter grid\n    batch_grid = [64, 128, 256]\n    max_epochs = 10\n    max_prefix_len = 10\n    lr = 1e-3\n\n    for ds_name, df in datasets.items():\n        experiment_data[\"hyperparam_tuning_type_1\"].setdefault(ds_name, {})\n        best_bs = None\n        best_val_top3 = -1.0\n        for bs in batch_grid:\n            try:\n                res = train_eval_one_setting(\n                    ds_name,\n                    df,\n                    batch_size=bs,\n                    max_epochs=max_epochs,\n                    max_prefix_len=max_prefix_len,\n                    lr=lr,\n                )\n            except RuntimeError as e:\n                print(f\"[warn] Runtime error for batch_size={bs}: {e}\")\n                res = None\n            key = f\"batch_size_{bs}\"\n            if res is None:\n                experiment_data[\"hyperparam_tuning_type_1\"][ds_name][key] = {\n                    \"error\": \"insufficient_data_or_runtime_error\"\n                }\n                continue\n            experiment_data[\"hyperparam_tuning_type_1\"][ds_name][key] = {\n                \"settings\": res[\"settings\"],\n                \"losses\": res[\"losses\"],\n                \"metrics\": res[\"metrics\"],\n                \"predictions\": res[\"predictions\"],\n                \"ground_truth\": res[\"ground_truth\"],\n                \"pad_idx\": res[\"pad_idx\"],\n                \"vocab_size\": res[\"settings\"][\"vocab_size\"],\n            }\n            # Track best by validation top-3 final\n            val_top3_final = res[\"metrics\"][\"val_final\"][\"top3\"]\n            if val_top3_final > best_val_top3:\n                best_val_top3 = val_top3_final\n                best_bs = bs\n                # store some best-level details\n                experiment_data[\"hyperparam_tuning_type_1\"][ds_name][\"best\"] = {\n                    \"batch_size\": best_bs,\n                    \"val_top3\": float(best_val_top3),\n                    \"note\": \"Consider linear LR scaling if very large batches help.\",\n                }\n        print(\n            f\"[{ds_name}] Best batch_size={best_bs} with val_top3={best_val_top3:.4f}\"\n        )\n\n    # Save all plottable data as a single numpy file\n    # Convert numpy arrays to lists where necessary for serialization via np.save of dict\n    # But numpy can save Python object dict with allow_pickle=True by default.\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n\n\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: batch_size.\nWe will implement a small grid search over DataLoader batch_size values {64, 128, 256} while keeping all other settings fixed. For each dataset and batch size, we train the baseline LSTM and record validation top-3 accuracy and loss across epochs, then select the best batch size by highest validation top-3. We use pm4py to load local XES files (falling back to a small synthetic dataset if unavailable), perform time-based splits, and store all plottable data (losses, metrics, predictions) inside a single experiment_data object saved to experiment_data.npy. If very large batches shine, a note is printed suggesting linear LR scaling as a follow-up.","overall_plan":"","plot_code":null,"plot_plan":null,"step":3,"id":"8809469610964dfb89ac1f461173f888","ctime":1757758835.4321167,"_term_out":["Using device: cuda","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":0.8928101062774658,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The run produced only \u201cUsing device: cuda\u201d and no further logs or results. This indicates the experiment did not actually execute training/evaluation. Likely issues: (1) Dataset discovery is too brittle and ignores the mandated input directory. The code only searches CWD and ./data for very specific filenames and does not consider common names (e.g., Road_Traffic_Fine_Management_Process.xes) or .xes.gz, nor the workspace ./input used by the provided loader. If pm4py is missing or files aren\u2019t found, it silently falls back to a synthetic dataset, violating the requirement to evaluate on BPI 2017 and ROAD. (2) Even if it proceeded, the script does not print any per-log metrics in the provided output; no training epochs or best batch-size summary appeared, so main likely didn\u2019t run or logging was suppressed/crashed early. (3) Requirements call for evaluating on two more BPM logs; this was not achieved in the observed run. Suggested fixes: \u2022 Integrate the robust loader from ai_scientist/ideas/my_research_topic.py (load_datasets) which searches ./input and handles .xes.gz and real filenames; or expand discover_xes_files to search ./input and ./workspace paths, support patterns like *.xes* and names containing BPI_Challenge_2012/2017 and Road_Traffic_Fine_Management_Process. \u2022 Ensure pm4py is installed and fail clearly if missing instead of defaulting to synthetic for this stage. \u2022 Add explicit logging in main to print dataset names, sample counts, per-epoch val metrics, and final per-log metrics and chosen best batch size. \u2022 Verify __main__ actually invokes main in the executed script. \u2022 Optionally build the act vocabulary on training data only to avoid minor leakage. After fixing, re-run with time-based splits and report next-activity metrics (acc/macro-F1/top-3) for BPI2017 and ROAD.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"batch_size","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport glob\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport warnings\n\n\n# Ensure deterministic behavior\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure per instruction\nexperiment_data = {\n    \"weight_decay_tuning\": {\n        # dataset_name will be added dynamically\n    }\n}\n\n# Try import pm4py for XES loading\ntry:\n    import pm4py\n    from pm4py.objects.log.importer.xes import importer as xes_importer\nexcept Exception as e:\n    raise RuntimeError(\n        \"pm4py is required to load local XES files. Please install pm4py.\"\n    ) from e\n\n\n# Utilities to load local XES datasets using pm4py\ndef _convert_event_log_to_df(log):\n    # pm4py event log to pandas DataFrame with columns: case_id, activity, timestamp, lifecycle (if any)\n    records = []\n    for trace in log:\n        case_id = trace.attributes.get(\"concept:name\", None)\n        for ev in trace:\n            act = ev.get(\"concept:name\", None)\n            ts = ev.get(\"time:timestamp\", None)\n            lifecycle = ev.get(\"lifecycle:transition\", None)\n            records.append(\n                {\n                    \"case_id\": case_id,\n                    \"activity\": act,\n                    \"timestamp\": ts,\n                    \"lifecycle\": lifecycle,\n                }\n            )\n    df = pd.DataFrame(records)\n    # Drop rows with missing essentials\n    df = df.dropna(subset=[\"case_id\", \"activity\", \"timestamp\"])\n    # Ensure timestamp type\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True)\n    df[\"case_id\"] = df[\"case_id\"].astype(str)\n    df[\"activity\"] = df[\"activity\"].astype(str)\n    if \"lifecycle\" in df.columns:\n        df[\"lifecycle\"] = df[\"lifecycle\"].astype(str)\n    return df\n\n\ndef load_local_xes_datasets(search_dirs=None):\n    # Search for .xes or .xes.gz within current directory and given search_dirs\n    if search_dirs is None:\n        search_dirs = [os.getcwd()]\n    files = []\n    for d in search_dirs:\n        files.extend(glob.glob(os.path.join(d, \"**\", \"*.xes\"), recursive=True))\n        files.extend(glob.glob(os.path.join(d, \"**\", \"*.xes.gz\"), recursive=True))\n    datasets = {}\n    # Try to identify known BPM datasets by filename patterns; else load all with a generic name\n    preferred = {\n        \"BPI2012\": [\"2012\", \"bpi2012\"],\n        \"BPI2017\": [\"2017\", \"bpi2017\"],\n        \"ROAD\": [\"road\", \"Road\"],\n    }\n    assigned = set()\n    # Assign by preference\n    for name, patterns in preferred.items():\n        for f in files:\n            low = os.path.basename(f).lower()\n            if any(p in low for p in patterns) and f not in assigned:\n                try:\n                    log = xes_importer.apply(f)\n                    df = _convert_event_log_to_df(log)\n                    # Keep earliest 5000 cases for speed (as in base code)\n                    starts = (\n                        df.sort_values(\"timestamp\")\n                        .groupby(\"case_id\")[\"timestamp\"]\n                        .min()\n                        .reset_index()\n                    )\n                    if len(starts) > 5000:\n                        keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                        df = df[df[\"case_id\"].isin(keep_cases)].copy()\n                    datasets[name] = df\n                    assigned.add(f)\n                    break\n                except Exception as e:\n                    print(f\"[warn] Failed to load {f}: {e}\")\n    # Load remaining files with generic names if none of preferred matched\n    idx = 1\n    for f in files:\n        if f in assigned:\n            continue\n        try:\n            log = xes_importer.apply(f)\n            df = _convert_event_log_to_df(log)\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df = df[df[\"case_id\"].isin(keep_cases)].copy()\n            name = f\"DATA_{idx}\"\n            idx += 1\n            datasets[name] = df\n        except Exception as e:\n            print(f\"[warn] Failed to load {f}: {e}\")\n    if len(datasets) == 0:\n        raise RuntimeError(\n            \"No XES datasets found in the current directory or subdirectories.\"\n        )\n    return datasets\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        # Keep only 'complete' transitions if lifecycle exists; fallback to sorted if empty\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1 = [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    return avg_loss, acc, f1, top3, y_true, y_pred\n\n\ndef train_with_weight_decay(\n    name,\n    df,\n    max_epochs=10,\n    batch_size=128,\n    max_prefix_len=10,\n    lr=1e-3,\n    weight_decay=0.0,\n):\n    # Split and build samples\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Normalize features using train stats\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    # Datasets\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    if len(ds_train) == 0 or len(act2id) < 2:\n        return None  # not enough data\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=weight_decay)\n    # Training loop\n    best_val_top3 = -1.0\n    best_state = None\n    history = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        history[\"train_loss\"].append(train_loss)\n        history[\"val_loss\"].append(val_loss)\n        history[\"val_top3\"].append(val_top3)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    # Load best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    # Final eval\n    train_loss, train_acc, train_f1, train_top3, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n    results = {\n        \"config\": {\n            \"weight_decay\": float(weight_decay),\n            \"lr\": float(lr),\n            \"batch_size\": int(batch_size),\n            \"max_epochs\": int(max_epochs),\n            \"max_prefix_len\": int(max_prefix_len),\n            \"vocab_size\": int(len(act2id)),\n        },\n        \"history\": history,\n        \"metrics\": {\n            \"train\": {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n            \"val\": {\n                \"loss\": val_loss,\n                \"acc\": val_acc,\n                \"macro_f1\": val_f1,\n                \"top3\": val_top3,\n            },\n            \"test\": {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        },\n        \"predictions\": np.array(y_pred_t, dtype=np.int64),\n        \"ground_truth\": np.array(y_true_t, dtype=np.int64),\n        \"pad_id\": int(pad_id),\n        \"num_classes\": int(len(act2id) + 1),\n    }\n    return results\n\n\ndef main():\n    datasets = load_local_xes_datasets()\n    weight_decays = [0.0, 1e-5, 1e-4, 5e-4, 1e-3]\n    # Training settings (fixed across tuning)\n    max_epochs = 10\n    batch_size = 128\n    max_prefix_len = 10\n    lr = 1e-3\n\n    for dname, df in datasets.items():\n        print(\n            f\"\\n=== Dataset: {dname} | cases={df['case_id'].nunique()} events={len(df)} ===\"\n        )\n        experiment_data[\"weight_decay_tuning\"][dname] = {\"per_weight\": [], \"best\": None}\n        best_val_top3 = -1.0\n        best_result = None\n        for wd in weight_decays:\n            print(f\"Tuning weight_decay={wd}\")\n            res = train_with_weight_decay(\n                dname,\n                df,\n                max_epochs=max_epochs,\n                batch_size=batch_size,\n                max_prefix_len=max_prefix_len,\n                lr=lr,\n                weight_decay=wd,\n            )\n            if res is None:\n                print(\n                    \"Not enough data to train for this dataset. Skipping remaining weight decays.\"\n                )\n                break\n            # Record per-weight results\n            experiment_data[\"weight_decay_tuning\"][dname][\"per_weight\"].append(res)\n            val_top3 = res[\"metrics\"][\"val\"][\"top3\"]\n            print(f\" -> val_top3={val_top3:.4f} (wd={wd})\")\n            if val_top3 > best_val_top3:\n                best_val_top3 = val_top3\n                best_result = res\n        if best_result is not None:\n            experiment_data[\"weight_decay_tuning\"][dname][\"best\"] = best_result\n            print(\n                f\"[{dname}] Selected weight_decay={best_result['config']['weight_decay']} with val_top3={best_val_top3:.4f}\"\n            )\n        else:\n            print(f\"[{dname}] No valid model trained.\")\n\n    # Save all plottable data and metrics in a single file as required\n    # Convert numpy arrays where appropriate to ensure np.save works; keep structure\n    np.save(\"experiment_data.npy\", experiment_data, allow_pickle=True)\n    print(\"Saved experiment data to experiment_data.npy\")\n\n\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: weight_decay.\nI will add a hyperparameter tuning loop over weight_decay values [0, 1e-5, 1e-4, 5e-4, 1e-3], keeping all other training settings fixed. For each dataset loaded via pm4py from local XES files, I will train a model per weight decay, select the best by validation top-3 accuracy, and then report/train/test metrics of the selected model. I will store comprehensive per-weight results and the final selected model\u2019s results in a single experiment_data structure and save it once as experiment_data.npy. Time-based splits and BPM-relevant metrics (accuracy, macro-F1, top-3) are preserved.","overall_plan":"","plot_code":null,"plot_plan":null,"step":4,"id":"28ff0ab9ab904c7b8042dbf7d450c79f","ctime":1757758917.3912163,"_term_out":["Using device: cuda","\n","Execution time: a second seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1.6244087219238281,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The run produced only \"Using device: cuda\" and an execution-time line, with no dataset discovery, no tuning loop output, no metrics, and no saved experiment_data.npy. This indicates the training/evaluation did not execute as intended. Likely causes and concrete fixes:\n\n1) Dataset discovery/pm4py:\n   - If pm4py is missing, the script raises a RuntimeError and exits. Add a clear install guard and fail-fast message, or catch and print before exiting.\n   - The loader searches recursively from os.getcwd(); in the AI-Scientist/BPM-Scientist layout logs reside under ./input. Ensure explicit inclusion of ./input and ./data and use the robust resolver from ai_scientist/ideas/my_research_topic._resolve_data_dir. Example fix:\n       data_root = Path(\"input\") if (Path(\"input\").exists()) else Path.cwd()\n       files = list(data_root.rglob(\"*.xes\")) + list(data_root.rglob(\"*.xes.gz\"))\n\n2) Lifecycle filtering bug causing empty datasets:\n   - build_prefix_dataset drops all events when a lifecycle column exists but is empty/NaN, because df[\"lifecycle\"].astype(str).eq(\"complete\") yields false for all rows. Fix by conditioning on actual presence of the value 'complete' before filtering:\n       if \"lifecycle\" in df.columns and df[\"lifecycle\"].notna().any() and df[\"lifecycle\"].astype(str).str.contains(\"complete\", case=False).any():\n           df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n       df = df.sort_values([\"case_id\",\"timestamp\"])  # unconditionally sort after\n\n3) Evaluation/logging:\n   - Add prints per dataset for val/test metrics (acc, macro-F1, top-3) so progress is visible.\n   - Save experiment_data.npy only after successful runs; print its path.\n\n4) Minor modeling issues:\n   - Exclude PAD class from output logits/metrics by setting output size to vocab_size (without +1) and mapping labels accordingly; or mask PAD in loss.\n   - Ensure time-based split uses case start times (already done) and avoid leakage by removing the initial global normalization in build_prefix_dataset; only normalize based on train stats.\n\nAfter these fixes, rerun to evaluate at least BPI 2017 and ROAD logs with time-based splits and report per-log acc/macro-F1/top-3 for next-activity.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"weight_decay","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score, confusion_matrix\nfrom pathlib import Path\nfrom typing import Dict, List, Optional, Tuple\nimport random\nfrom datetime import datetime\n\n# Device handling (mandatory)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# ---------------- Robust XES discovery & loading ----------------\ndef _has_xes(dirpath: Path) -> bool:\n    try:\n        return dirpath.is_dir() and (\n            any(dirpath.glob(\"*.xes\")) or any(dirpath.glob(\"*.xes.gz\"))\n        )\n    except Exception:\n        return False\n\n\ndef _resolve_data_dir() -> Path:\n    candidates: List[Path] = []\n    candidates += [Path(\"input\").resolve(), (Path.cwd() / \"input\").resolve()]\n    cwd = Path.cwd().resolve()\n    for base in [cwd, *cwd.parents]:\n        candidates.append((base / \"data\").resolve())\n        candidates.append((base / \"input\").resolve())\n    candidates += [\n        Path(\"/workspace/input\"),\n        Path(\"/workspace/data\"),\n        Path(\"/workspace/ai_scientist/data\"),\n        Path(\"/workspace/AI-Scientist-v2/data\"),\n        Path(\"/workspace/experiments/data\"),\n        Path(\"/workspace/ai_scientist/input\"),\n        Path(\"/workspace/experiments/input\"),\n    ]\n    seen = set()\n    for p in candidates:\n        if p in seen:\n            continue\n        seen.add(p)\n        if _has_xes(p):\n            print(f\"[data] Using discovered data dir: {p}\")\n            return p\n    tried = \"\\n  - \" + \"\\n  - \".join(str(c) for c in candidates)\n    raise FileNotFoundError(\n        \"Could not locate a directory containing .xes files.\\n\"\n        f\"Checked:{tried}\\n\"\n        \"Tips:\\n\"\n        \"  \u2022 Ensure filenames include BPI 2012/2017 or 'Road_Traffic_Fine_Management_Process' for auto-match.\"\n    )\n\n\ndef _first_match(d: Path, patterns: List[str]) -> Optional[Path]:\n    for pat in patterns:\n        for p in d.glob(pat):\n            if p.is_file():\n                return p\n    return None\n\n\ndef xes_to_df(xes_path: Path) -> pd.DataFrame:\n    try:\n        from pm4py.objects.log.importer.xes import importer as xes_importer\n    except Exception as e:\n        raise ImportError(\"pm4py is required. Install via `pip install pm4py`.\") from e\n    print(f\"[data] Loading XES: {xes_path}\")\n    log = xes_importer.apply(str(xes_path))\n    rows = []\n    for tr in log:\n        case_id = tr.attributes.get(\"concept:name\") or tr.attributes.get(\n            \"case:concept:name\"\n        )\n        for e in tr:\n            rows.append(\n                {\n                    \"case_id\": str(case_id),\n                    \"activity\": str(e.get(\"concept:name\")),\n                    \"lifecycle\": str(e.get(\"lifecycle:transition\", \"complete\")),\n                    \"timestamp\": e.get(\"time:timestamp\"),\n                    \"resource\": str(e.get(\"org:resource\", \"System\")),\n                }\n            )\n    df = pd.DataFrame(rows)\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True, errors=\"coerce\")\n    df = df.dropna(subset=[\"timestamp\"]).reset_index(drop=True)\n    df = df[[\"case_id\", \"activity\", \"lifecycle\", \"timestamp\", \"resource\"]]\n    df = df.sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\ndef load_datasets() -> Dict[str, pd.DataFrame]:\n    data_dir = _resolve_data_dir()\n    patterns = {\n        \"BPI2012\": [\"BPI_Challenge_2012*.xes*\", \"BPI2012*.xes*\", \"*2012*.xes*\"],\n        \"BPI2017\": [\"BPI_Challenge_2017*.xes*\", \"BPI2017*.xes*\", \"*2017*.xes*\"],\n        \"ROAD\": [\n            \"Road_Traffic_Fine_Management_Process*.xes*\",\n            \"*Traffic*Fine*.xes*\",\n            \"*Traffic*.xes*\",\n        ],\n    }\n    loaded: Dict[str, pd.DataFrame] = {}\n    for key, pats in patterns.items():\n        path = _first_match(data_dir, pats)\n        if path is not None:\n            try:\n                loaded[key] = xes_to_df(path)\n                print(\n                    f\"[data] Loaded {key}: events={len(loaded[key])}, cases={loaded[key]['case_id'].nunique()}\"\n                )\n            except Exception as e:\n                print(f\"[warn] Failed to load {key} from {path}: {e}\")\n        else:\n            print(f\"[data] Not found for {key} (patterns {pats})\")\n    if not loaded:\n        # Fallback to any .xes files with generic names\n        any_files = list(data_dir.glob(\"*.xes\")) + list(data_dir.glob(\"*.xes.gz\"))\n        for p in any_files:\n            key = p.stem\n            try:\n                loaded[key] = xes_to_df(p)\n            except Exception as e:\n                print(f\"[warn] Failed to load {p}: {e}\")\n    return loaded\n\n\n# ---------------- Prefix building and splits ----------------\ndef build_prefix_dataset(df, max_prefix_len=15, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        # keep completes if present; otherwise keep all\n        lc_mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if lc_mask.any():\n            df = df[lc_mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\", sort=False):\n        g = g.sort_values(\"timestamp\")\n        ts = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy() // 10**9\n        )\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": str(cid),\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                }\n            )\n    # Normalize time deltas and since_start using global (temporary) stats; will re-norm by train stats later\n    if len(samples) > 0:\n        all_feats = np.concatenate(\n            [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n        )\n        dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n        for s in samples:\n            if s[\"seq_feats\"].shape[0] > 0:\n                s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.groupby(\"case_id\", as_index=False)[\"timestamp\"]\n        .min()\n        .sort_values(\"timestamp\")\n    )\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"].astype(str))\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"].astype(str))\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"].astype(str))\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=15, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\n# ---------------- Model ----------------\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.3)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\n# ---------------- Metrics ----------------\ndef compute_ece(probs: np.ndarray, y_true: np.ndarray, n_bins: int = 10) -> float:\n    # probs: (N, C), y_true: (N,)\n    if probs.size == 0 or y_true.size == 0:\n        return 0.0\n    confidences = probs.max(axis=1)\n    predictions = probs.argmax(axis=1)\n    accuracies = (predictions == y_true).astype(np.float32)\n    bins = np.linspace(0.0, 1.0, n_bins + 1)\n    ece = 0.0\n    for i in range(n_bins):\n        mask = (confidences > bins[i]) & (\n            confidences <= bins[i + 1] if i < n_bins - 1 else confidences <= bins[i + 1]\n        )\n        if not np.any(mask):\n            continue\n        bin_acc = accuracies[mask].mean()\n        bin_conf = confidences[mask].mean()\n        ece += (np.sum(mask) / len(confidences)) * abs(bin_acc - bin_conf)\n    return float(ece)\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, probs_list = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            # Exclude PAD from being predicted by setting its logit very low\n            logits[:, pad_idx] = -1e9\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            probs_list.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys, dtype=np.int64)\n    y_pred = np.array(preds_top1, dtype=np.int64)\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(probs_list, axis=0)\n        if len(probs_list) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    ece = compute_ece(probs_concat, y_true, n_bins=10)\n    return avg_loss, acc, f1, top3, ece, y_true, y_pred, probs_concat\n\n\n# ---------------- Training & Tuning ----------------\ndef train_with_epoch_tuning(\n    name,\n    df,\n    base_epochs=40,\n    maybe_extend_to=60,\n    batch_size=256,\n    max_prefix_len=15,\n    lr=3e-4,\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples and vocab\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter splits\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only (no leakage)\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return None\n\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training with early stopping and potential extension\n    best_val_top3 = -1.0\n    best_state = None\n    best_epoch = 0\n    hist = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_top3\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_ece\": [],\n    }\n    patience = 8\n    no_improve = 0\n\n    def train_epochs(n_epochs, start_epoch_idx=0):\n        nonlocal best_val_top3, best_state, best_epoch, no_improve\n        epochs_run = 0\n        for e in range(1, n_epochs + 1):\n            epoch = start_epoch_idx + e\n            model.train()\n            total = 0\n            running_loss = 0.0\n            for batch in dl_train:\n                batch = {\n                    k: v.to(device)\n                    for k, v in batch.items()\n                    if isinstance(v, torch.Tensor)\n                }\n                optimizer.zero_grad()\n                logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n                logits[:, pad_id] = -1e9  # mask PAD from being predicted\n                loss = criterion(logits, batch[\"y\"])\n                loss.backward()\n                optimizer.step()\n                running_loss += loss.item() * logits.size(0)\n                total += logits.size(0)\n            train_loss = running_loss / max(1, total)\n            val_loss, val_acc, val_f1, val_top3, val_ece, _, _, _ = evaluate(\n                model, dl_val, criterion, device, len(act2id), pad_id\n            )\n            print(\n                f\"Epoch {epoch}: validation_loss = {val_loss:.4f} | acc={val_acc:.4f} | f1={val_f1:.4f} | top3={val_top3:.4f} | ece={val_ece:.4f}\"\n            )\n            hist[\"train_loss\"].append(train_loss)\n            hist[\"val_loss\"].append(val_loss)\n            hist[\"val_top3\"].append(val_top3)\n            hist[\"val_acc\"].append(val_acc)\n            hist[\"val_f1\"].append(val_f1)\n            hist[\"val_ece\"].append(val_ece)\n            if val_top3 > best_val_top3 + 1e-6:\n                best_val_top3 = val_top3\n                best_state = {\n                    k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n                }\n                best_epoch = epoch\n                no_improve = 0\n            else:\n                no_improve += 1\n            if no_improve >= patience:\n                print(f\"Early stopping (no improvement in {patience} epochs).\")\n                break\n            epochs_run += 1\n        return start_epoch_idx + epochs_run\n\n    last_epoch = train_epochs(base_epochs, start_epoch_idx=0)\n\n    def should_extend(val_top3_hist, base_epochs):\n        if len(val_top3_hist) < min(10, base_epochs):\n            return False\n        last5 = val_top3_hist[-5:]\n        prev5 = val_top3_hist[-10:-5]\n        if len(prev5) < 5:\n            return False\n        mean_gain = np.mean(last5) - np.mean(prev5)\n        condition = (best_epoch >= max(1, base_epochs - 3)) and (mean_gain > 0.002)\n        return condition\n\n    if should_extend(hist[\"val_top3\"], base_epochs) and maybe_extend_to > len(\n        hist[\"train_loss\"]\n    ):\n        print(\n            f\"Extending training to {maybe_extend_to} epochs due to improving validation top-3.\"\n        )\n        if best_state is not None:\n            model.load_state_dict(best_state)\n            model.to(device)\n        # reset patience\n        nonlocal_no_improve = 0  # local variable to avoid interference; but we will reuse no_improve variable\n        no_improve = 0\n        extra_epochs = maybe_extend_to - len(hist[\"train_loss\"])\n        if extra_epochs > 0:\n            last_epoch = train_epochs(\n                extra_epochs, start_epoch_idx=len(hist[\"train_loss\"])\n            )\n\n    # Load best checkpoint\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final evaluations\n    train_loss, train_acc, train_f1, train_top3, train_ece, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, val_ece, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, test_ece, y_true_t, y_pred_t, probs_t = (\n        evaluate(model, dl_test, criterion, device, len(act2id), pad_id)\n    )\n\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f} ece={train_ece:.4f}\"\n    )\n    print(\n        f\"[{name}] Val:   loss={val_loss:.4f} acc={val_acc:.4f} f1={val_f1:.4f} top3={val_top3:.4f} ece={val_ece:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f} ece={test_ece:.4f}\"\n    )\n\n    # Prepare results dict for this dataset\n    results = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": train_loss,\n                        \"acc\": train_acc,\n                        \"macro_f1\": train_f1,\n                        \"top3\": train_top3,\n                        \"ece\": train_ece,\n                    },\n                )\n            ],\n            \"val\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": val_loss,\n                        \"acc\": val_acc,\n                        \"macro_f1\": val_f1,\n                        \"top3\": val_top3,\n                        \"ece\": val_ece,\n                    },\n                )\n            ],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": test_loss,\n                        \"acc\": test_acc,\n                        \"macro_f1\": test_f1,\n                        \"top3\": test_top3,\n                        \"ece\": test_ece,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(hist[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(hist[\"val_loss\"], start=1)),\n        },\n        \"val_curves\": {\n            \"acc\": list(enumerate(hist[\"val_acc\"], start=1)),\n            \"f1\": list(enumerate(hist[\"val_f1\"], start=1)),\n            \"top3\": list(enumerate(hist[\"val_top3\"], start=1)),\n            \"ece\": list(enumerate(hist[\"val_ece\"], start=1)),\n        },\n        \"predictions\": y_pred_t.tolist(),\n        \"ground_truth\": y_true_t.tolist(),\n        \"epochs_trained\": len(hist[\"train_loss\"]),\n        \"best_val_top3\": best_val_top3,\n        \"best_epoch\": best_epoch,\n        \"vocab_size\": len(act2id),\n        \"pad_idx\": pad_id,\n    }\n\n    # Save arrays\n    base = os.path.join(working_dir, name)\n    np.save(\n        os.path.join(working_dir, f\"{name}_train_loss.npy\"),\n        np.array(hist[\"train_loss\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_loss.npy\"),\n        np.array(hist[\"val_loss\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_top3.npy\"),\n        np.array(hist[\"val_top3\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_acc.npy\"),\n        np.array(hist[\"val_acc\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_f1.npy\"),\n        np.array(hist[\"val_f1\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_val_ece.npy\"),\n        np.array(hist[\"val_ece\"], dtype=np.float32),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_y_true.npy\"),\n        np.array(y_true_t, dtype=np.int64),\n    )\n    np.save(\n        os.path.join(working_dir, f\"{name}_y_pred.npy\"),\n        np.array(y_pred_t, dtype=np.int64),\n    )\n    try:\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"{name}_confusion_matrix.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n    return results\n\n\n# ---------------- Experiment Orchestration ----------------\nexperiment_data = {}\n\n\ndef main():\n    global experiment_data\n    datasets = load_datasets()\n    if len(datasets) == 0:\n        print(\"No datasets found. Exiting after saving empty experiment_data.\")\n        np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n        return\n    # Ensure keys present for BPI2017 and ROAD if available; limit large datasets by earliest 5000 cases for runtime\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.groupby(\"case_id\", as_index=False)[\"timestamp\"]\n                .min()\n                .sort_values(\"timestamp\")\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        res = train_with_epoch_tuning(\n            key,\n            df_small,\n            base_epochs=40,\n            maybe_extend_to=60,\n            batch_size=256,\n            max_prefix_len=15,\n            lr=3e-4,\n        )\n        if res is not None:\n            experiment_data[key] = res\n            # also append per-epoch metrics to experiment_data for protocol\n            # Already contained in res under losses and val_curves\n    # Save consolidated experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n\n\n# Execute immediately (no __main__ guard)\nmain()\n","plan":"The previous script failed to find local XES logs because it only searched a \u201cdata\u201d folder; I replaced the loader with a robust resolver that prioritizes the workspace \u201cinput/\u201d directory and supports both .xes and .xes.gz, matching BPI 2012/2017 and Road Traffic logs. I also fixed evaluation by excluding the PAD class from predictions (masking its logit) and added Expected Calibration Error (ECE) computation and tracking each epoch. Hyperparameters were tuned (more epochs, slightly larger prefix length, adjusted learning rate and batch size) without changing the LSTM architecture. The code enforces time-based splits, builds prefix features safely, computes required next-activity metrics (acc, macro-F1, top-3, ECE) per split and per dataset, and saves all artifacts under ./working.","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\n# Load experiment data\ntry:\n    experiment_data = np.load(\n        os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n    ).item()\n    if not isinstance(experiment_data, dict):\n        raise ValueError(\"experiment_data.npy did not contain a dictionary.\")\nexcept Exception as e:\n    print(f\"Error loading experiment data: {e}\")\n    experiment_data = {}\n\n# Print metrics and plot\nfrom sklearn.metrics import confusion_matrix\nimport itertools\n\nfor ds_name, res in experiment_data.items():\n    print(f\"\\n=== {ds_name} Metrics ===\")\n    try:\n        test_metrics = dict(res.get(\"metrics\", {}).get(\"test\", [(\"final\", {})])[0][1])\n        print(\"Test metrics:\")\n        for k, v in test_metrics.items():\n            print(f\" - {k}: {v:.4f}\")\n    except Exception as e:\n        print(f\"Could not print metrics for {ds_name}: {e}\")\n\n    # 1) Train vs Val loss\n    try:\n        train_loss = np.array(res.get(\"losses\", {}).get(\"train\", []))\n        val_loss = np.array(res.get(\"losses\", {}).get(\"val\", []))\n        if train_loss.size > 0 or val_loss.size > 0:\n            plt.figure()\n            if train_loss.size > 0:\n                plt.plot(train_loss[:, 0], train_loss[:, 1], label=\"Train Loss\")\n            if val_loss.size > 0:\n                plt.plot(val_loss[:, 0], val_loss[:, 1], label=\"Val Loss\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.title(\n                f\"{ds_name} Training and Validation Loss\\nSubtitle: Time-based split, Next-Activity task\"\n            )\n            plt.legend()\n            out = os.path.join(working_dir, f\"{ds_name}_train_val_loss.png\")\n            plt.savefig(out)\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating loss plot for {ds_name}: {e}\")\n        try:\n            plt.close()\n        except:\n            pass\n\n    # 2) Validation metric curves (acc, f1, top3, ece)\n    try:\n        val_curves = res.get(\"val_curves\", {})\n        have_any = any(\n            len(val_curves.get(k, [])) > 0 for k in [\"acc\", \"f1\", \"top3\", \"ece\"]\n        )\n        if have_any:\n            plt.figure()\n            for key, label in [\n                (\"acc\", \"Val Accuracy\"),\n                (\"f1\", \"Val Macro-F1\"),\n                (\"top3\", \"Val Top-3\"),\n                (\"ece\", \"Val ECE\"),\n            ]:\n                arr = np.array(val_curves.get(key, []))\n                if arr.size > 0:\n                    plt.plot(arr[:, 0], arr[:, 1], label=label)\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Metric value\")\n            plt.title(\n                f\"{ds_name} Validation Curves\\nSubtitle: Acc/F1/Top-3/ECE (Next-Activity)\"\n            )\n            plt.legend()\n            out = os.path.join(working_dir, f\"{ds_name}_val_curves.png\")\n            plt.savefig(out)\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating validation curves for {ds_name}: {e}\")\n        try:\n            plt.close()\n        except:\n            pass\n\n    # 3) Confusion matrix (test)\n    try:\n        cm_path = os.path.join(working_dir, f\"{ds_name}_confusion_matrix.npy\")\n        cm = None\n        if os.path.exists(cm_path):\n            cm = np.load(cm_path)\n        else:\n            y_true = np.array(res.get(\"ground_truth\", []))\n            y_pred = np.array(res.get(\"predictions\", []))\n            if y_true.size > 0 and y_pred.size > 0:\n                cm = confusion_matrix(y_true, y_pred)\n        if cm is not None and cm.size > 0:\n            plt.figure()\n            plt.imshow(cm, interpolation=\"nearest\", cmap=plt.cm.Blues)\n            plt.title(\n                f\"{ds_name} Confusion Matrix (Test)\\nSubtitle: Next-Activity classification\"\n            )\n            plt.colorbar()\n            tick_marks = np.arange(min(20, cm.shape[0]))\n            # For readability, limit ticks if too many classes\n            if cm.shape[0] <= 20:\n                plt.xticks(np.arange(cm.shape[1]))\n                plt.yticks(np.arange(cm.shape[0]))\n            else:\n                plt.xticks(tick_marks)\n                plt.yticks(tick_marks)\n            plt.xlabel(\"Predicted label\")\n            plt.ylabel(\"True label\")\n            plt.tight_layout()\n            out = os.path.join(working_dir, f\"{ds_name}_confusion_matrix.png\")\n            plt.savefig(out)\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {ds_name}: {e}\")\n        try:\n            plt.close()\n        except:\n            pass\n\n    # 4) Validation Top-3 zoomed (if available) to satisfy task-specific plot\n    try:\n        top3 = np.array(res.get(\"val_curves\", {}).get(\"top3\", []))\n        if top3.size > 0:\n            plt.figure()\n            plt.plot(top3[:, 0], top3[:, 1], label=\"Val Top-3 Accuracy\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Top-3 Accuracy\")\n            plt.title(\n                f\"{ds_name} Val Top-3 Accuracy over Epochs\\nSubtitle: Next-Activity task\"\n            )\n            plt.legend()\n            out = os.path.join(working_dir, f\"{ds_name}_val_top3.png\")\n            plt.savefig(out)\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating top-3 plot for {ds_name}: {e}\")\n        try:\n            plt.close()\n        except:\n            pass\n\n# Also try to include any pre-saved per-dataset arrays if present (generic loader)\nfor ds_name in experiment_data.keys():\n    try:\n        # Already printed; nothing extra beyond constraints\n        pass\n    except Exception as e:\n        print(f\"Extra plotting error for {ds_name}: {e}\")\n\n# Print a brief summary table to stdout\nfor ds_name, res in experiment_data.items():\n    try:\n        tm = dict(res.get(\"metrics\", {}).get(\"test\", [(\"final\", {})])[0][1])\n        print(\n            f\"[Summary] {ds_name}: loss={tm.get('loss', np.nan):.4f}, acc={tm.get('acc', np.nan):.4f}, macro_f1={tm.get('macro_f1', np.nan):.4f}, top3={tm.get('top3', np.nan):.4f}, ece={tm.get('ece', np.nan):.4f}\"\n        )\n    except Exception as e:\n        print(f\"Error printing summary for {ds_name}: {e}\")\n","plot_plan":"We will analyze existing experiment_data.npy to report and visualize next-activity prediction results without re-running training. For each dataset stored, we will print consolidated BPM metrics (test loss, accuracy, macro-F1, top-3 accuracy, ECE) using the saved experiment_data dictionary. We will create standard visualizations that only use saved arrays: training vs validation loss over epochs, validation metric curves (accuracy, macro-F1, top-3, ECE), and the test confusion matrix. For confusion matrices, we will first try a saved matrix file per dataset; if missing, we compute it from saved y_true and y_pred in experiment_data.npy. We will save all plots into working_dir with descriptive filenames that include the dataset name and plot type. Each figure will be created in its own try-except block, titled clearly with the dataset and a subtitle indicating the plot content, and figures will always be closed after saving. We will also limit the number of figures to a maximum of five per dataset. Finally, the script will gracefully handle the absence of experiment_data.npy by reporting the error and exiting.","step":5,"id":"251df5cdee2b452db709366215875b0a","ctime":1757758927.310301,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<24:33,  8.88it/s]","\rparsing log, completed traces ::   1%|1         | 150/13087 [00:00<00:15, 833.33it/s]","\rparsing log, completed traces ::   2%|2         | 299/13087 [00:00<00:11, 1123.60it/s]","\rparsing log, completed traces ::   3%|3         | 450/13087 [00:00<00:09, 1272.77it/s]","\rparsing log, completed traces ::   5%|4         | 610/13087 [00:00<00:08, 1387.11it/s]","\rparsing log, completed traces ::   6%|6         | 794/13087 [00:00<00:08, 1533.70it/s]","\rparsing log, completed traces ::   7%|7         | 949/13087 [00:00<00:07, 1536.25it/s]","\rparsing log, completed traces ::   8%|8         | 1106/13087 [00:00<00:07, 1544.88it/s]","\rparsing log, completed traces ::  10%|9         | 1270/13087 [00:00<00:07, 1569.51it/s]","\rparsing log, completed traces ::  11%|#1        | 1469/13087 [00:01<00:06, 1686.80it/s]","\rparsing log, completed traces ::  13%|#2        | 1638/13087 [00:01<00:13, 834.87it/s] ","\rparsing log, completed traces ::  14%|#3        | 1810/13087 [00:01<00:11, 990.64it/s]","\rparsing log, completed traces ::  15%|#4        | 1959/13087 [00:01<00:10, 1090.87it/s]","\rparsing log, completed traces ::  16%|#6        | 2119/13087 [00:01<00:09, 1200.83it/s]","\rparsing log, completed traces ::  17%|#7        | 2283/13087 [00:01<00:08, 1303.28it/s]","\rparsing log, completed traces ::  19%|#8        | 2465/13087 [00:01<00:07, 1430.15it/s]","\rparsing log, completed traces ::  20%|##        | 2632/13087 [00:02<00:07, 1493.31it/s]","\rparsing log, completed traces ::  21%|##1       | 2795/13087 [00:02<00:07, 1467.52it/s]","\rparsing log, completed traces ::  23%|##2       | 2951/13087 [00:02<00:06, 1465.06it/s]","\rparsing log, completed traces ::  24%|##3       | 3107/13087 [00:02<00:06, 1487.80it/s]","\rparsing log, completed traces ::  25%|##5       | 3312/13087 [00:02<00:05, 1646.90it/s]","\rparsing log, completed traces ::  27%|##6       | 3522/13087 [00:02<00:05, 1770.56it/s]","\rparsing log, completed traces ::  28%|##8       | 3703/13087 [00:02<00:05, 1768.23it/s]","\rparsing log, completed traces ::  30%|##9       | 3883/13087 [00:02<00:05, 1709.43it/s]","\rparsing log, completed traces ::  31%|###1      | 4102/13087 [00:02<00:04, 1846.72it/s]","\rparsing log, completed traces ::  33%|###3      | 4336/13087 [00:03<00:04, 1989.46it/s]","\rparsing log, completed traces ::  35%|###4      | 4537/13087 [00:03<00:08, 1020.20it/s]","\rparsing log, completed traces ::  36%|###6      | 4717/13087 [00:03<00:07, 1157.26it/s]","\rparsing log, completed traces ::  37%|###7      | 4885/13087 [00:03<00:06, 1262.16it/s]","\rparsing log, completed traces ::  39%|###8      | 5049/13087 [00:03<00:06, 1242.02it/s]","\rparsing log, completed traces ::  40%|###9      | 5200/13087 [00:03<00:06, 1285.09it/s]","\rparsing log, completed traces ::  41%|####      | 5359/13087 [00:03<00:05, 1356.59it/s]","\rparsing log, completed traces ::  42%|####2     | 5510/13087 [00:04<00:05, 1380.47it/s]","\rparsing log, completed traces ::  43%|####3     | 5673/13087 [00:04<00:05, 1446.16it/s]","\rparsing log, completed traces ::  45%|####4     | 5827/13087 [00:04<00:04, 1453.37it/s]","\rparsing log, completed traces ::  46%|####5     | 6010/13087 [00:04<00:04, 1558.60it/s]","\rparsing log, completed traces ::  47%|####7     | 6171/13087 [00:04<00:04, 1550.43it/s]","\rparsing log, completed traces ::  48%|####8     | 6336/13087 [00:04<00:04, 1577.87it/s]","\rparsing log, completed traces ::  50%|####9     | 6497/13087 [00:04<00:04, 1349.60it/s]","\rparsing log, completed traces ::  51%|#####     | 6650/13087 [00:04<00:04, 1396.42it/s]","\rparsing log, completed traces ::  52%|#####1    | 6801/13087 [00:04<00:04, 1426.84it/s]","\rparsing log, completed traces ::  53%|#####3    | 6949/13087 [00:05<00:04, 1384.06it/s]","\rparsing log, completed traces ::  54%|#####4    | 7114/13087 [00:05<00:04, 1457.57it/s]","\rparsing log, completed traces ::  56%|#####5    | 7279/13087 [00:05<00:03, 1510.46it/s]","\rparsing log, completed traces ::  57%|#####6    | 7433/13087 [00:05<00:03, 1494.75it/s]","\rparsing log, completed traces ::  58%|#####7    | 7585/13087 [00:05<00:07, 725.32it/s] ","\rparsing log, completed traces ::  59%|#####9    | 7736/13087 [00:05<00:06, 855.23it/s]","\rparsing log, completed traces ::  60%|######    | 7887/13087 [00:06<00:05, 980.21it/s]","\rparsing log, completed traces ::  61%|######1   | 8032/13087 [00:06<00:04, 1080.99it/s]","\rparsing log, completed traces ::  63%|######2   | 8201/13087 [00:06<00:03, 1223.52it/s]","\rparsing log, completed traces ::  64%|######3   | 8375/13087 [00:06<00:03, 1350.38it/s]","\rparsing log, completed traces ::  65%|######5   | 8539/13087 [00:06<00:03, 1420.55it/s]","\rparsing log, completed traces ::  67%|######6   | 8715/13087 [00:06<00:02, 1504.36it/s]","\rparsing log, completed traces ::  68%|######7   | 8877/13087 [00:06<00:02, 1514.70it/s]","\rparsing log, completed traces ::  69%|######9   | 9037/13087 [00:06<00:02, 1535.42it/s]","\rparsing log, completed traces ::  70%|#######   | 9196/13087 [00:06<00:02, 1548.97it/s]","\rparsing log, completed traces ::  72%|#######1  | 9376/13087 [00:06<00:02, 1618.47it/s]","\rparsing log, completed traces ::  73%|#######2  | 9541/13087 [00:07<00:02, 1558.88it/s]","\rparsing log, completed traces ::  74%|#######4  | 9700/13087 [00:07<00:02, 1561.85it/s]","\rparsing log, completed traces ::  75%|#######5  | 9876/13087 [00:07<00:01, 1619.09it/s]","\rparsing log, completed traces ::  77%|#######6  | 10040/13087 [00:07<00:01, 1580.95it/s]","\rparsing log, completed traces ::  78%|#######7  | 10200/13087 [00:07<00:01, 1565.83it/s]","\rparsing log, completed traces ::  79%|#######9  | 10358/13087 [00:07<00:01, 1540.05it/s]","\rparsing log, completed traces ::  80%|########  | 10513/13087 [00:07<00:01, 1493.08it/s]","\rparsing log, completed traces ::  82%|########1 | 10673/13087 [00:07<00:01, 1513.59it/s]","\rparsing log, completed traces ::  83%|########2 | 10840/13087 [00:07<00:01, 1555.75it/s]","\rparsing log, completed traces ::  84%|########4 | 10997/13087 [00:08<00:02, 705.46it/s] ","\rparsing log, completed traces ::  85%|########5 | 11166/13087 [00:08<00:02, 861.18it/s]","\rparsing log, completed traces ::  87%|########6 | 11338/13087 [00:08<00:01, 1017.62it/s]","\rparsing log, completed traces ::  88%|########8 | 11524/13087 [00:08<00:01, 1190.65it/s]","\rparsing log, completed traces ::  89%|########9 | 11700/13087 [00:08<00:01, 1320.85it/s]","\rparsing log, completed traces ::  91%|######### | 11890/13087 [00:08<00:00, 1463.25it/s]","\rparsing log, completed traces ::  92%|#########2| 12069/13087 [00:09<00:00, 1540.97it/s]","\rparsing log, completed traces ::  94%|#########3| 12279/13087 [00:09<00:00, 1690.19it/s]","\rparsing log, completed traces ::  95%|#########5| 12463/13087 [00:09<00:00, 1724.22it/s]","\rparsing log, completed traces ::  97%|#########6| 12659/13087 [00:09<00:00, 1789.58it/s]","\rparsing log, completed traces ::  98%|#########8| 12846/13087 [00:09<00:00, 1806.72it/s]","\rparsing log, completed traces :: 100%|#########9| 13037/13087 [00:09<00:00, 1828.81it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:09<00:00, 1370.22it/s]","\n","[data] Loaded BPI2012: events=262200, cases=13087","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:56:09,  1.77it/s]","\rparsing log, completed traces ::   0%|          | 66/31509 [00:00<03:57, 132.28it/s]","\rparsing log, completed traces ::   0%|          | 121/31509 [00:00<02:19, 224.97it/s]","\rparsing log, completed traces ::   1%|          | 185/31509 [00:00<01:36, 323.52it/s]","\rparsing log, completed traces ::   1%|          | 246/31509 [00:00<01:18, 396.23it/s]","\rparsing log, completed traces ::   1%|          | 308/31509 [00:01<01:08, 455.00it/s]","\rparsing log, completed traces ::   1%|1         | 368/31509 [00:01<01:03, 492.77it/s]","\rparsing log, completed traces ::   1%|1         | 429/31509 [00:01<00:59, 525.56it/s]","\rparsing log, completed traces ::   2%|1         | 488/31509 [00:01<00:57, 543.36it/s]","\rparsing log, completed traces ::   2%|1         | 547/31509 [00:01<00:56, 548.90it/s]","\rparsing log, completed traces ::   2%|1         | 608/31509 [00:01<00:54, 562.89it/s]","\rparsing log, completed traces ::   2%|2         | 677/31509 [00:01<00:51, 598.88it/s]","\rparsing log, completed traces ::   2%|2         | 739/31509 [00:01<00:51, 603.24it/s]","\rparsing log, completed traces ::   3%|2         | 801/31509 [00:01<00:51, 601.14it/s]","\rparsing log, completed traces ::   3%|2         | 862/31509 [00:02<01:38, 310.63it/s]","\rparsing log, completed traces ::   3%|2         | 927/31509 [00:02<01:22, 370.74it/s]","\rparsing log, completed traces ::   3%|3         | 994/31509 [00:02<01:10, 431.11it/s]","\rparsing log, completed traces ::   3%|3         | 1053/31509 [00:02<01:05, 466.55it/s]","\rparsing log, completed traces ::   4%|3         | 1116/31509 [00:02<01:00, 502.89it/s]","\rparsing log, completed traces ::   4%|3         | 1181/31509 [00:02<00:56, 540.22it/s]","\rparsing log, completed traces ::   4%|3         | 1249/31509 [00:02<00:52, 575.37it/s]","\rparsing log, completed traces ::   4%|4         | 1312/31509 [00:03<00:52, 578.79it/s]","\rparsing log, completed traces ::   4%|4         | 1382/31509 [00:03<00:49, 611.46it/s]","\rparsing log, completed traces ::   5%|4         | 1446/31509 [00:03<00:50, 591.51it/s]","\rparsing log, completed traces ::   5%|4         | 1508/31509 [00:03<00:50, 594.41it/s]","\rparsing log, completed traces ::   5%|4         | 1572/31509 [00:03<00:49, 606.69it/s]","\rparsing log, completed traces ::   5%|5         | 1635/31509 [00:03<00:48, 611.02it/s]","\rparsing log, completed traces ::   5%|5         | 1697/31509 [00:03<00:49, 605.62it/s]","\rparsing log, completed traces ::   6%|5         | 1760/31509 [00:03<00:48, 609.41it/s]","\rparsing log, completed traces ::   6%|5         | 1822/31509 [00:03<00:50, 589.71it/s]","\rparsing log, completed traces ::   6%|5         | 1882/31509 [00:03<00:50, 587.51it/s]","\rparsing log, completed traces ::   6%|6         | 1945/31509 [00:04<00:49, 597.01it/s]","\rparsing log, completed traces ::   6%|6         | 2005/31509 [00:04<01:36, 307.00it/s]","\rparsing log, completed traces ::   7%|6         | 2065/31509 [00:04<01:22, 358.39it/s]","\rparsing log, completed traces ::   7%|6         | 2129/31509 [00:04<01:10, 414.21it/s]","\rparsing log, completed traces ::   7%|6         | 2193/31509 [00:04<01:03, 463.06it/s]","\rparsing log, completed traces ::   7%|7         | 2259/31509 [00:04<00:57, 510.43it/s]","\rparsing log, completed traces ::   7%|7         | 2324/31509 [00:04<00:53, 546.05it/s]","\rparsing log, completed traces ::   8%|7         | 2386/31509 [00:05<00:51, 564.69it/s]","\rparsing log, completed traces ::   8%|7         | 2450/31509 [00:05<00:49, 584.58it/s]","\rparsing log, completed traces ::   8%|7         | 2514/31509 [00:05<00:48, 600.19it/s]","\rparsing log, completed traces ::   8%|8         | 2586/31509 [00:05<00:45, 633.21it/s]","\rparsing log, completed traces ::   8%|8         | 2653/31509 [00:05<00:44, 643.74it/s]","\rparsing log, completed traces ::   9%|8         | 2719/31509 [00:05<00:45, 633.11it/s]","\rparsing log, completed traces ::   9%|8         | 2788/31509 [00:05<00:44, 648.84it/s]","\rparsing log, completed traces ::   9%|9         | 2859/31509 [00:05<00:43, 665.18it/s]","\rparsing log, completed traces ::   9%|9         | 2929/31509 [00:05<00:42, 671.68it/s]","\rparsing log, completed traces ::  10%|9         | 3002/31509 [00:06<00:41, 686.86it/s]","\rparsing log, completed traces ::  10%|9         | 3071/31509 [00:06<00:43, 661.04it/s]","\rparsing log, completed traces ::  10%|9         | 3138/31509 [00:06<00:43, 651.42it/s]","\rparsing log, completed traces ::  10%|#         | 3204/31509 [00:06<00:44, 638.66it/s]","\rparsing log, completed traces ::  10%|#         | 3273/31509 [00:06<00:43, 651.99it/s]","\rparsing log, completed traces ::  11%|#         | 3339/31509 [00:06<01:25, 327.80it/s]","\rparsing log, completed traces ::  11%|#         | 3409/31509 [00:06<01:11, 391.00it/s]","\rparsing log, completed traces ::  11%|#1        | 3480/31509 [00:07<01:01, 453.30it/s]","\rparsing log, completed traces ::  11%|#1        | 3545/31509 [00:07<00:56, 495.11it/s]","\rparsing log, completed traces ::  11%|#1        | 3614/31509 [00:07<00:51, 540.75it/s]","\rparsing log, completed traces ::  12%|#1        | 3683/31509 [00:07<00:48, 575.12it/s]","\rparsing log, completed traces ::  12%|#1        | 3751/31509 [00:07<00:46, 601.16it/s]","\rparsing log, completed traces ::  12%|#2        | 3817/31509 [00:07<00:45, 607.75it/s]","\rparsing log, completed traces ::  12%|#2        | 3884/31509 [00:07<00:44, 624.36it/s]","\rparsing log, completed traces ::  13%|#2        | 3952/31509 [00:07<00:43, 639.00it/s]","\rparsing log, completed traces ::  13%|#2        | 4021/31509 [00:07<00:42, 653.56it/s]","\rparsing log, completed traces ::  13%|#2        | 4088/31509 [00:08<00:42, 647.53it/s]","\rparsing log, completed traces ::  13%|#3        | 4156/31509 [00:08<00:41, 656.54it/s]","\rparsing log, completed traces ::  13%|#3        | 4223/31509 [00:08<00:42, 648.02it/s]","\rparsing log, completed traces ::  14%|#3        | 4289/31509 [00:08<00:43, 632.44it/s]","\rparsing log, completed traces ::  14%|#3        | 4355/31509 [00:08<00:42, 639.30it/s]","\rparsing log, completed traces ::  14%|#4        | 4423/31509 [00:08<00:41, 650.07it/s]","\rparsing log, completed traces ::  14%|#4        | 4489/31509 [00:08<00:42, 636.20it/s]","\rparsing log, completed traces ::  14%|#4        | 4553/31509 [00:08<00:42, 635.28it/s]","\rparsing log, completed traces ::  15%|#4        | 4619/31509 [00:08<00:42, 639.19it/s]","\rparsing log, completed traces ::  15%|#4        | 4689/31509 [00:08<00:40, 656.49it/s]","\rparsing log, completed traces ::  15%|#5        | 4761/31509 [00:09<00:39, 673.58it/s]","\rparsing log, completed traces ::  15%|#5        | 4829/31509 [00:09<01:28, 301.60it/s]","\rparsing log, completed traces ::  16%|#5        | 4895/31509 [00:09<01:14, 357.84it/s]","\rparsing log, completed traces ::  16%|#5        | 4962/31509 [00:09<01:04, 413.88it/s]","\rparsing log, completed traces ::  16%|#5        | 5031/31509 [00:09<00:56, 470.63it/s]","\rparsing log, completed traces ::  16%|#6        | 5104/31509 [00:09<00:49, 529.56it/s]","\rparsing log, completed traces ::  16%|#6        | 5169/31509 [00:10<00:47, 553.65it/s]","\rparsing log, completed traces ::  17%|#6        | 5240/31509 [00:10<00:44, 593.44it/s]","\rparsing log, completed traces ::  17%|#6        | 5307/31509 [00:10<00:43, 608.96it/s]","\rparsing log, completed traces ::  17%|#7        | 5374/31509 [00:10<00:41, 622.31it/s]","\rparsing log, completed traces ::  17%|#7        | 5441/31509 [00:10<00:41, 633.73it/s]","\rparsing log, completed traces ::  17%|#7        | 5513/31509 [00:10<00:39, 657.72it/s]","\rparsing log, completed traces ::  18%|#7        | 5583/31509 [00:10<00:38, 669.46it/s]","\rparsing log, completed traces ::  18%|#7        | 5656/31509 [00:10<00:37, 686.02it/s]","\rparsing log, completed traces ::  18%|#8        | 5732/31509 [00:10<00:36, 704.77it/s]","\rparsing log, completed traces ::  18%|#8        | 5804/31509 [00:10<00:36, 695.83it/s]","\rparsing log, completed traces ::  19%|#8        | 5876/31509 [00:11<00:36, 702.07it/s]","\rparsing log, completed traces ::  19%|#8        | 5953/31509 [00:11<00:35, 716.93it/s]","\rparsing log, completed traces ::  19%|#9        | 6025/31509 [00:11<00:36, 691.00it/s]","\rparsing log, completed traces ::  19%|#9        | 6095/31509 [00:11<00:37, 679.59it/s]","\rparsing log, completed traces ::  20%|#9        | 6166/31509 [00:11<00:36, 687.73it/s]","\rparsing log, completed traces ::  20%|#9        | 6235/31509 [00:11<00:36, 687.86it/s]","\rparsing log, completed traces ::  20%|##        | 6304/31509 [00:11<00:37, 672.11it/s]","\rparsing log, completed traces ::  20%|##        | 6373/31509 [00:11<00:37, 676.68it/s]","\rparsing log, completed traces ::  20%|##        | 6441/31509 [00:11<00:37, 669.74it/s]","\rparsing log, completed traces ::  21%|##        | 6509/31509 [00:12<01:25, 291.64it/s]","\rparsing log, completed traces ::  21%|##        | 6564/31509 [00:12<01:15, 330.82it/s]","\rparsing log, completed traces ::  21%|##1       | 6631/31509 [00:12<01:03, 390.68it/s]","\rparsing log, completed traces ::  21%|##1       | 6697/31509 [00:12<00:55, 445.46it/s]","\rparsing log, completed traces ::  21%|##1       | 6763/31509 [00:12<00:50, 493.36it/s]","\rparsing log, completed traces ::  22%|##1       | 6831/31509 [00:12<00:46, 535.31it/s]","\rparsing log, completed traces ::  22%|##1       | 6895/31509 [00:13<00:43, 562.15it/s]","\rparsing log, completed traces ::  22%|##2       | 6961/31509 [00:13<00:41, 586.44it/s]","\rparsing log, completed traces ::  22%|##2       | 7034/31509 [00:13<00:39, 625.03it/s]","\rparsing log, completed traces ::  23%|##2       | 7101/31509 [00:13<00:38, 629.20it/s]","\rparsing log, completed traces ::  23%|##2       | 7167/31509 [00:13<00:38, 634.41it/s]","\rparsing log, completed traces ::  23%|##2       | 7233/31509 [00:13<00:38, 629.55it/s]","\rparsing log, completed traces ::  23%|##3       | 7300/31509 [00:13<00:37, 639.01it/s]","\rparsing log, completed traces ::  23%|##3       | 7365/31509 [00:13<00:37, 637.51it/s]","\rparsing log, completed traces ::  24%|##3       | 7430/31509 [00:13<00:37, 640.89it/s]","\rparsing log, completed traces ::  24%|##3       | 7498/31509 [00:13<00:36, 650.53it/s]","\rparsing log, completed traces ::  24%|##4       | 7571/31509 [00:14<00:35, 667.06it/s]","\rparsing log, completed traces ::  24%|##4       | 7638/31509 [00:14<00:36, 650.52it/s]","\rparsing log, completed traces ::  24%|##4       | 7704/31509 [00:14<00:36, 650.00it/s]","\rparsing log, completed traces ::  25%|##4       | 7770/31509 [00:14<00:37, 637.52it/s]","\rparsing log, completed traces ::  25%|##4       | 7837/31509 [00:14<00:36, 644.98it/s]","\rparsing log, completed traces ::  25%|##5       | 7907/31509 [00:14<00:35, 660.62it/s]","\rparsing log, completed traces ::  25%|##5       | 7974/31509 [00:14<00:35, 662.96it/s]","\rparsing log, completed traces ::  26%|##5       | 8042/31509 [00:14<00:35, 666.50it/s]","\rparsing log, completed traces ::  26%|##5       | 8109/31509 [00:14<00:35, 659.72it/s]","\rparsing log, completed traces ::  26%|##5       | 8178/31509 [00:15<00:34, 666.88it/s]","\rparsing log, completed traces ::  26%|##6       | 8245/31509 [00:15<00:34, 666.63it/s]","\rparsing log, completed traces ::  26%|##6       | 8312/31509 [00:15<01:28, 260.86it/s]","\rparsing log, completed traces ::  27%|##6       | 8376/31509 [00:15<01:13, 314.65it/s]","\rparsing log, completed traces ::  27%|##6       | 8439/31509 [00:15<01:02, 367.13it/s]","\rparsing log, completed traces ::  27%|##7       | 8508/31509 [00:16<00:53, 429.70it/s]","\rparsing log, completed traces ::  27%|##7       | 8569/31509 [00:16<00:49, 465.14it/s]","\rparsing log, completed traces ::  27%|##7       | 8636/31509 [00:16<00:44, 512.38it/s]","\rparsing log, completed traces ::  28%|##7       | 8702/31509 [00:16<00:41, 547.06it/s]","\rparsing log, completed traces ::  28%|##7       | 8769/31509 [00:16<00:39, 579.29it/s]","\rparsing log, completed traces ::  28%|##8       | 8835/31509 [00:16<00:37, 598.76it/s]","\rparsing log, completed traces ::  28%|##8       | 8900/31509 [00:16<00:37, 609.41it/s]","\rparsing log, completed traces ::  28%|##8       | 8965/31509 [00:16<00:36, 619.97it/s]","\rparsing log, completed traces ::  29%|##8       | 9030/31509 [00:16<00:36, 609.24it/s]","\rparsing log, completed traces ::  29%|##8       | 9094/31509 [00:16<00:36, 617.29it/s]","\rparsing log, completed traces ::  29%|##9       | 9159/31509 [00:17<00:35, 626.57it/s]","\rparsing log, completed traces ::  29%|##9       | 9223/31509 [00:17<00:36, 616.93it/s]","\rparsing log, completed traces ::  29%|##9       | 9286/31509 [00:17<00:36, 616.76it/s]","\rparsing log, completed traces ::  30%|##9       | 9356/31509 [00:17<00:34, 638.65it/s]","\rparsing log, completed traces ::  30%|##9       | 9421/31509 [00:17<00:35, 630.11it/s]","\rparsing log, completed traces ::  30%|###       | 9485/31509 [00:17<00:35, 623.96it/s]","\rparsing log, completed traces ::  30%|###       | 9552/31509 [00:17<00:34, 635.09it/s]","\rparsing log, completed traces ::  31%|###       | 9616/31509 [00:17<00:34, 631.99it/s]","\rparsing log, completed traces ::  31%|###       | 9680/31509 [00:17<00:34, 629.57it/s]","\rparsing log, completed traces ::  31%|###       | 9744/31509 [00:18<00:35, 614.98it/s]","\rparsing log, completed traces ::  31%|###1      | 9808/31509 [00:18<00:34, 621.98it/s]","\rparsing log, completed traces ::  31%|###1      | 9871/31509 [00:18<00:34, 620.49it/s]","\rparsing log, completed traces ::  32%|###1      | 9934/31509 [00:18<00:34, 619.96it/s]","\rparsing log, completed traces ::  32%|###1      | 9997/31509 [00:18<00:35, 612.46it/s]","\rparsing log, completed traces ::  32%|###1      | 10060/31509 [00:18<00:35, 609.82it/s]","\rparsing log, completed traces ::  32%|###2      | 10122/31509 [00:18<00:35, 598.09it/s]","\rparsing log, completed traces ::  32%|###2      | 10186/31509 [00:18<00:35, 608.19it/s]","\rparsing log, completed traces ::  33%|###2      | 10254/31509 [00:18<00:33, 627.85it/s]","\rparsing log, completed traces ::  33%|###2      | 10317/31509 [00:19<01:31, 230.35it/s]","\rparsing log, completed traces ::  33%|###2      | 10375/31509 [00:19<01:16, 276.44it/s]","\rparsing log, completed traces ::  33%|###3      | 10439/31509 [00:19<01:03, 334.43it/s]","\rparsing log, completed traces ::  33%|###3      | 10497/31509 [00:19<00:55, 379.58it/s]","\rparsing log, completed traces ::  34%|###3      | 10558/31509 [00:19<00:48, 427.73it/s]","\rparsing log, completed traces ::  34%|###3      | 10618/31509 [00:20<00:44, 466.87it/s]","\rparsing log, completed traces ::  34%|###3      | 10680/31509 [00:20<00:41, 503.37it/s]","\rparsing log, completed traces ::  34%|###4      | 10741/31509 [00:20<00:39, 531.07it/s]","\rparsing log, completed traces ::  34%|###4      | 10801/31509 [00:20<00:38, 534.38it/s]","\rparsing log, completed traces ::  34%|###4      | 10859/31509 [00:20<00:38, 533.95it/s]","\rparsing log, completed traces ::  35%|###4      | 10921/31509 [00:20<00:36, 557.54it/s]","\rparsing log, completed traces ::  35%|###4      | 10981/31509 [00:20<00:36, 568.21it/s]","\rparsing log, completed traces ::  35%|###5      | 11044/31509 [00:20<00:34, 585.50it/s]","\rparsing log, completed traces ::  35%|###5      | 11107/31509 [00:20<00:34, 597.79it/s]","\rparsing log, completed traces ::  35%|###5      | 11171/31509 [00:20<00:33, 608.25it/s]","\rparsing log, completed traces ::  36%|###5      | 11237/31509 [00:21<00:32, 621.72it/s]","\rparsing log, completed traces ::  36%|###5      | 11302/31509 [00:21<00:32, 629.63it/s]","\rparsing log, completed traces ::  36%|###6      | 11366/31509 [00:21<00:33, 609.75it/s]","\rparsing log, completed traces ::  36%|###6      | 11428/31509 [00:21<00:32, 610.12it/s]","\rparsing log, completed traces ::  36%|###6      | 11491/31509 [00:21<00:32, 614.43it/s]","\rparsing log, completed traces ::  37%|###6      | 11553/31509 [00:21<00:33, 602.02it/s]","\rparsing log, completed traces ::  37%|###6      | 11616/31509 [00:21<00:32, 609.99it/s]","\rparsing log, completed traces ::  37%|###7      | 11679/31509 [00:21<00:32, 612.69it/s]","\rparsing log, completed traces ::  37%|###7      | 11745/31509 [00:21<00:31, 624.46it/s]","\rparsing log, completed traces ::  37%|###7      | 11811/31509 [00:21<00:31, 632.45it/s]","\rparsing log, completed traces ::  38%|###7      | 11878/31509 [00:22<00:30, 640.83it/s]","\rparsing log, completed traces ::  38%|###7      | 11947/31509 [00:22<00:29, 655.25it/s]","\rparsing log, completed traces ::  38%|###8      | 12013/31509 [00:22<00:30, 646.07it/s]","\rparsing log, completed traces ::  38%|###8      | 12078/31509 [00:22<00:30, 645.80it/s]","\rparsing log, completed traces ::  39%|###8      | 12143/31509 [00:22<00:30, 641.31it/s]","\rparsing log, completed traces ::  39%|###8      | 12208/31509 [00:22<00:30, 640.49it/s]","\rparsing log, completed traces ::  39%|###8      | 12273/31509 [00:22<00:30, 637.55it/s]","\rparsing log, completed traces ::  39%|###9      | 12340/31509 [00:22<00:29, 646.01it/s]","\rparsing log, completed traces ::  39%|###9      | 12405/31509 [00:22<00:29, 638.38it/s]","\rparsing log, completed traces ::  40%|###9      | 12470/31509 [00:23<01:22, 229.55it/s]","\rparsing log, completed traces ::  40%|###9      | 12531/31509 [00:23<01:08, 278.97it/s]","\rparsing log, completed traces ::  40%|###9      | 12593/31509 [00:23<00:56, 332.22it/s]","\rparsing log, completed traces ::  40%|####      | 12656/31509 [00:23<00:48, 386.13it/s]","\rparsing log, completed traces ::  40%|####      | 12725/31509 [00:24<00:41, 448.12it/s]","\rparsing log, completed traces ::  41%|####      | 12786/31509 [00:24<00:39, 476.62it/s]","\rparsing log, completed traces ::  41%|####      | 12848/31509 [00:24<00:36, 509.83it/s]","\rparsing log, completed traces ::  41%|####      | 12909/31509 [00:24<00:34, 535.05it/s]","\rparsing log, completed traces ::  41%|####1     | 12973/31509 [00:24<00:32, 562.01it/s]","\rparsing log, completed traces ::  41%|####1     | 13039/31509 [00:24<00:31, 587.79it/s]","\rparsing log, completed traces ::  42%|####1     | 13111/31509 [00:24<00:29, 624.12it/s]","\rparsing log, completed traces ::  42%|####1     | 13177/31509 [00:24<00:29, 615.71it/s]","\rparsing log, completed traces ::  42%|####2     | 13241/31509 [00:24<00:29, 615.47it/s]","\rparsing log, completed traces ::  42%|####2     | 13305/31509 [00:24<00:29, 619.38it/s]","\rparsing log, completed traces ::  42%|####2     | 13370/31509 [00:25<00:29, 625.10it/s]","\rparsing log, completed traces ::  43%|####2     | 13434/31509 [00:25<00:28, 629.06it/s]","\rparsing log, completed traces ::  43%|####2     | 13498/31509 [00:25<00:28, 627.69it/s]","\rparsing log, completed traces ::  43%|####3     | 13562/31509 [00:25<00:28, 625.44it/s]","\rparsing log, completed traces ::  43%|####3     | 13625/31509 [00:25<00:29, 615.26it/s]","\rparsing log, completed traces ::  43%|####3     | 13688/31509 [00:25<00:28, 617.37it/s]","\rparsing log, completed traces ::  44%|####3     | 13753/31509 [00:25<00:28, 626.77it/s]","\rparsing log, completed traces ::  44%|####3     | 13817/31509 [00:25<00:28, 629.93it/s]","\rparsing log, completed traces ::  44%|####4     | 13881/31509 [00:25<00:28, 622.09it/s]","\rparsing log, completed traces ::  44%|####4     | 13948/31509 [00:25<00:27, 634.22it/s]","\rparsing log, completed traces ::  44%|####4     | 14012/31509 [00:26<00:27, 626.41it/s]","\rparsing log, completed traces ::  45%|####4     | 14080/31509 [00:26<00:27, 640.85it/s]","\rparsing log, completed traces ::  45%|####4     | 14146/31509 [00:26<00:26, 646.03it/s]","\rparsing log, completed traces ::  45%|####5     | 14211/31509 [00:26<00:27, 640.57it/s]","\rparsing log, completed traces ::  45%|####5     | 14277/31509 [00:26<00:26, 644.01it/s]","\rparsing log, completed traces ::  46%|####5     | 14345/31509 [00:26<00:26, 653.74it/s]","\rparsing log, completed traces ::  46%|####5     | 14415/31509 [00:26<00:25, 665.51it/s]","\rparsing log, completed traces ::  46%|####5     | 14482/31509 [00:26<00:25, 657.13it/s]","\rparsing log, completed traces ::  46%|####6     | 14548/31509 [00:26<00:26, 631.51it/s]","\rparsing log, completed traces ::  46%|####6     | 14612/31509 [00:26<00:26, 628.28it/s]","\rparsing log, completed traces ::  47%|####6     | 14676/31509 [00:27<00:26, 630.32it/s]","\rparsing log, completed traces ::  47%|####6     | 14742/31509 [00:27<00:26, 635.59it/s]","\rparsing log, completed traces ::  47%|####7     | 14812/31509 [00:27<00:25, 653.31it/s]","\rparsing log, completed traces ::  47%|####7     | 14878/31509 [00:27<00:25, 641.64it/s]","\rparsing log, completed traces ::  47%|####7     | 14953/31509 [00:27<00:24, 671.44it/s]","\rparsing log, completed traces ::  48%|####7     | 15021/31509 [00:28<01:13, 222.87it/s]","\rparsing log, completed traces ::  48%|####7     | 15096/31509 [00:28<00:57, 287.11it/s]","\rparsing log, completed traces ::  48%|####8     | 15160/31509 [00:28<00:48, 338.94it/s]","\rparsing log, completed traces ::  48%|####8     | 15221/31509 [00:28<00:42, 386.18it/s]","\rparsing log, completed traces ::  49%|####8     | 15291/31509 [00:28<00:36, 448.39it/s]","\rparsing log, completed traces ::  49%|####8     | 15359/31509 [00:28<00:32, 497.96it/s]","\rparsing log, completed traces ::  49%|####8     | 15426/31509 [00:28<00:29, 536.96it/s]","\rparsing log, completed traces ::  49%|####9     | 15492/31509 [00:28<00:28, 568.18it/s]","\rparsing log, completed traces ::  49%|####9     | 15561/31509 [00:29<00:26, 600.00it/s]","\rparsing log, completed traces ::  50%|####9     | 15630/31509 [00:29<00:25, 624.37it/s]","\rparsing log, completed traces ::  50%|####9     | 15698/31509 [00:29<00:24, 636.56it/s]","\rparsing log, completed traces ::  50%|#####     | 15765/31509 [00:29<00:24, 629.95it/s]","\rparsing log, completed traces ::  50%|#####     | 15831/31509 [00:29<00:24, 629.86it/s]","\rparsing log, completed traces ::  50%|#####     | 15900/31509 [00:29<00:24, 646.55it/s]","\rparsing log, completed traces ::  51%|#####     | 15966/31509 [00:29<00:24, 645.31it/s]","\rparsing log, completed traces ::  51%|#####     | 16032/31509 [00:29<00:24, 639.34it/s]","\rparsing log, completed traces ::  51%|#####1    | 16101/31509 [00:29<00:23, 653.87it/s]","\rparsing log, completed traces ::  51%|#####1    | 16173/31509 [00:30<00:22, 672.84it/s]","\rparsing log, completed traces ::  52%|#####1    | 16241/31509 [00:30<00:23, 662.46it/s]","\rparsing log, completed traces ::  52%|#####1    | 16310/31509 [00:30<00:22, 669.86it/s]","\rparsing log, completed traces ::  52%|#####1    | 16378/31509 [00:30<00:23, 640.10it/s]","\rparsing log, completed traces ::  52%|#####2    | 16443/31509 [00:30<00:23, 636.89it/s]","\rparsing log, completed traces ::  52%|#####2    | 16507/31509 [00:30<00:24, 612.94it/s]","\rparsing log, completed traces ::  53%|#####2    | 16573/31509 [00:30<00:23, 625.84it/s]","\rparsing log, completed traces ::  53%|#####2    | 16640/31509 [00:30<00:23, 636.01it/s]","\rparsing log, completed traces ::  53%|#####3    | 16710/31509 [00:30<00:22, 652.58it/s]","\rparsing log, completed traces ::  53%|#####3    | 16776/31509 [00:30<00:22, 642.72it/s]","\rparsing log, completed traces ::  53%|#####3    | 16841/31509 [00:31<00:22, 644.36it/s]","\rparsing log, completed traces ::  54%|#####3    | 16906/31509 [00:31<00:22, 645.50it/s]","\rparsing log, completed traces ::  54%|#####3    | 16973/31509 [00:31<00:22, 649.63it/s]","\rparsing log, completed traces ::  54%|#####4    | 17044/31509 [00:31<00:21, 667.37it/s]","\rparsing log, completed traces ::  54%|#####4    | 17111/31509 [00:31<00:21, 662.97it/s]","\rparsing log, completed traces ::  55%|#####4    | 17178/31509 [00:31<00:21, 661.39it/s]","\rparsing log, completed traces ::  55%|#####4    | 17245/31509 [00:31<00:21, 652.07it/s]","\rparsing log, completed traces ::  55%|#####4    | 17312/31509 [00:31<00:21, 656.94it/s]","\rparsing log, completed traces ::  55%|#####5    | 17378/31509 [00:31<00:21, 654.60it/s]","\rparsing log, completed traces ::  55%|#####5    | 17450/31509 [00:31<00:20, 672.29it/s]","\rparsing log, completed traces ::  56%|#####5    | 17518/31509 [00:32<00:21, 642.04it/s]","\rparsing log, completed traces ::  56%|#####5    | 17588/31509 [00:32<00:21, 656.23it/s]","\rparsing log, completed traces ::  56%|#####6    | 17660/31509 [00:32<00:20, 673.59it/s]","\rparsing log, completed traces ::  56%|#####6    | 17728/31509 [00:32<00:20, 667.59it/s]","\rparsing log, completed traces ::  56%|#####6    | 17795/31509 [00:32<00:20, 667.54it/s]","\rparsing log, completed traces ::  57%|#####6    | 17865/31509 [00:32<00:20, 676.72it/s]","\rparsing log, completed traces ::  57%|#####6    | 17933/31509 [00:32<00:20, 668.02it/s]","\rparsing log, completed traces ::  57%|#####7    | 18002/31509 [00:32<00:20, 674.12it/s]","\rparsing log, completed traces ::  57%|#####7    | 18070/31509 [00:33<01:07, 197.90it/s]","\rparsing log, completed traces ::  58%|#####7    | 18138/31509 [00:33<00:53, 250.59it/s]","\rparsing log, completed traces ::  58%|#####7    | 18204/31509 [00:33<00:43, 305.29it/s]","\rparsing log, completed traces ::  58%|#####7    | 18274/31509 [00:34<00:35, 368.95it/s]","\rparsing log, completed traces ::  58%|#####8    | 18337/31509 [00:34<00:31, 417.74it/s]","\rparsing log, completed traces ::  58%|#####8    | 18403/31509 [00:34<00:27, 468.80it/s]","\rparsing log, completed traces ::  59%|#####8    | 18474/31509 [00:34<00:24, 524.00it/s]","\rparsing log, completed traces ::  59%|#####8    | 18540/31509 [00:34<00:23, 551.13it/s]","\rparsing log, completed traces ::  59%|#####9    | 18605/31509 [00:34<00:22, 574.64it/s]","\rparsing log, completed traces ::  59%|#####9    | 18685/31509 [00:34<00:20, 632.39it/s]","\rparsing log, completed traces ::  60%|#####9    | 18761/31509 [00:34<00:19, 667.16it/s]","\rparsing log, completed traces ::  60%|#####9    | 18832/31509 [00:34<00:18, 675.21it/s]","\rparsing log, completed traces ::  60%|######    | 18911/31509 [00:34<00:17, 705.42it/s]","\rparsing log, completed traces ::  60%|######    | 18984/31509 [00:35<00:17, 706.49it/s]","\rparsing log, completed traces ::  60%|######    | 19057/31509 [00:35<00:17, 709.83it/s]","\rparsing log, completed traces ::  61%|######    | 19130/31509 [00:35<00:17, 715.37it/s]","\rparsing log, completed traces ::  61%|######    | 19203/31509 [00:35<00:17, 697.13it/s]","\rparsing log, completed traces ::  61%|######1   | 19274/31509 [00:35<00:17, 688.75it/s]","\rparsing log, completed traces ::  61%|######1   | 19344/31509 [00:35<00:17, 689.80it/s]","\rparsing log, completed traces ::  62%|######1   | 19416/31509 [00:35<00:17, 698.15it/s]","\rparsing log, completed traces ::  62%|######1   | 19487/31509 [00:35<00:17, 697.06it/s]","\rparsing log, completed traces ::  62%|######2   | 19559/31509 [00:35<00:16, 703.17it/s]","\rparsing log, completed traces ::  62%|######2   | 19630/31509 [00:35<00:17, 689.55it/s]","\rparsing log, completed traces ::  63%|######2   | 19700/31509 [00:36<00:17, 670.39it/s]","\rparsing log, completed traces ::  63%|######2   | 19768/31509 [00:36<00:17, 661.73it/s]","\rparsing log, completed traces ::  63%|######2   | 19835/31509 [00:36<00:17, 661.60it/s]","\rparsing log, completed traces ::  63%|######3   | 19902/31509 [00:36<00:17, 647.73it/s]","\rparsing log, completed traces ::  63%|######3   | 19969/31509 [00:36<00:17, 654.08it/s]","\rparsing log, completed traces ::  64%|######3   | 20035/31509 [00:36<00:17, 655.29it/s]","\rparsing log, completed traces ::  64%|######3   | 20101/31509 [00:36<00:17, 646.81it/s]","\rparsing log, completed traces ::  64%|######4   | 20168/31509 [00:36<00:17, 652.74it/s]","\rparsing log, completed traces ::  64%|######4   | 20240/31509 [00:36<00:16, 669.09it/s]","\rparsing log, completed traces ::  64%|######4   | 20312/31509 [00:37<00:16, 680.63it/s]","\rparsing log, completed traces ::  65%|######4   | 20381/31509 [00:37<00:16, 678.16it/s]","\rparsing log, completed traces ::  65%|######4   | 20458/31509 [00:37<00:15, 702.02it/s]","\rparsing log, completed traces ::  65%|######5   | 20529/31509 [00:37<00:15, 702.06it/s]","\rparsing log, completed traces ::  65%|######5   | 20601/31509 [00:37<00:15, 704.98it/s]","\rparsing log, completed traces ::  66%|######5   | 20673/31509 [00:37<00:15, 708.11it/s]","\rparsing log, completed traces ::  66%|######5   | 20746/31509 [00:37<00:15, 713.95it/s]","\rparsing log, completed traces ::  66%|######6   | 20818/31509 [00:37<00:15, 705.73it/s]","\rparsing log, completed traces ::  66%|######6   | 20889/31509 [00:37<00:15, 689.00it/s]","\rparsing log, completed traces ::  67%|######6   | 20958/31509 [00:37<00:15, 674.07it/s]","\rparsing log, completed traces ::  67%|######6   | 21026/31509 [00:38<00:15, 668.74it/s]","\rparsing log, completed traces ::  67%|######6   | 21093/31509 [00:38<00:15, 662.68it/s]","\rparsing log, completed traces ::  67%|######7   | 21160/31509 [00:38<00:15, 657.76it/s]","\rparsing log, completed traces ::  67%|######7   | 21232/31509 [00:38<00:15, 673.81it/s]","\rparsing log, completed traces ::  68%|######7   | 21300/31509 [00:38<00:15, 670.38it/s]","\rparsing log, completed traces ::  68%|######7   | 21368/31509 [00:38<00:15, 670.66it/s]","\rparsing log, completed traces ::  68%|######8   | 21440/31509 [00:38<00:14, 682.19it/s]","\rparsing log, completed traces ::  68%|######8   | 21509/31509 [00:39<00:52, 189.08it/s]","\rparsing log, completed traces ::  68%|######8   | 21580/31509 [00:39<00:40, 243.41it/s]","\rparsing log, completed traces ::  69%|######8   | 21645/31509 [00:39<00:33, 295.96it/s]","\rparsing log, completed traces ::  69%|######8   | 21714/31509 [00:39<00:27, 357.41it/s]","\rparsing log, completed traces ::  69%|######9   | 21786/31509 [00:40<00:22, 422.94it/s]","\rparsing log, completed traces ::  69%|######9   | 21858/31509 [00:40<00:19, 484.04it/s]","\rparsing log, completed traces ::  70%|######9   | 21929/31509 [00:40<00:17, 534.83it/s]","\rparsing log, completed traces ::  70%|######9   | 21999/31509 [00:40<00:16, 574.96it/s]","\rparsing log, completed traces ::  70%|#######   | 22071/31509 [00:40<00:15, 612.23it/s]","\rparsing log, completed traces ::  70%|#######   | 22143/31509 [00:40<00:14, 639.52it/s]","\rparsing log, completed traces ::  71%|#######   | 22214/31509 [00:40<00:14, 650.89it/s]","\rparsing log, completed traces ::  71%|#######   | 22284/31509 [00:40<00:13, 663.56it/s]","\rparsing log, completed traces ::  71%|#######   | 22354/31509 [00:40<00:13, 663.85it/s]","\rparsing log, completed traces ::  71%|#######1  | 22429/31509 [00:40<00:13, 686.98it/s]","\rparsing log, completed traces ::  71%|#######1  | 22502/31509 [00:41<00:12, 697.32it/s]","\rparsing log, completed traces ::  72%|#######1  | 22573/31509 [00:41<00:12, 689.26it/s]","\rparsing log, completed traces ::  72%|#######1  | 22643/31509 [00:41<00:12, 691.90it/s]","\rparsing log, completed traces ::  72%|#######2  | 22713/31509 [00:41<00:12, 693.66it/s]","\rparsing log, completed traces ::  72%|#######2  | 22785/31509 [00:41<00:12, 699.83it/s]","\rparsing log, completed traces ::  73%|#######2  | 22856/31509 [00:41<00:12, 697.63it/s]","\rparsing log, completed traces ::  73%|#######2  | 22926/31509 [00:41<00:12, 675.28it/s]","\rparsing log, completed traces ::  73%|#######2  | 22994/31509 [00:41<00:12, 672.19it/s]","\rparsing log, completed traces ::  73%|#######3  | 23062/31509 [00:41<00:12, 673.67it/s]","\rparsing log, completed traces ::  73%|#######3  | 23130/31509 [00:41<00:12, 665.84it/s]","\rparsing log, completed traces ::  74%|#######3  | 23197/31509 [00:42<00:12, 660.91it/s]","\rparsing log, completed traces ::  74%|#######3  | 23264/31509 [00:42<00:12, 659.36it/s]","\rparsing log, completed traces ::  74%|#######4  | 23330/31509 [00:42<00:12, 651.77it/s]","\rparsing log, completed traces ::  74%|#######4  | 23396/31509 [00:42<00:12, 649.84it/s]","\rparsing log, completed traces ::  74%|#######4  | 23463/31509 [00:42<00:12, 653.95it/s]","\rparsing log, completed traces ::  75%|#######4  | 23531/31509 [00:42<00:12, 658.71it/s]","\rparsing log, completed traces ::  75%|#######4  | 23601/31509 [00:42<00:11, 668.28it/s]","\rparsing log, completed traces ::  75%|#######5  | 23669/31509 [00:42<00:11, 670.06it/s]","\rparsing log, completed traces ::  75%|#######5  | 23739/31509 [00:42<00:11, 675.97it/s]","\rparsing log, completed traces ::  76%|#######5  | 23807/31509 [00:43<00:11, 673.68it/s]","\rparsing log, completed traces ::  76%|#######5  | 23875/31509 [00:43<00:11, 675.48it/s]","\rparsing log, completed traces ::  76%|#######5  | 23943/31509 [00:43<00:11, 668.12it/s]","\rparsing log, completed traces ::  76%|#######6  | 24010/31509 [00:43<00:11, 663.12it/s]","\rparsing log, completed traces ::  76%|#######6  | 24078/31509 [00:43<00:11, 665.34it/s]","\rparsing log, completed traces ::  77%|#######6  | 24146/31509 [00:43<00:11, 666.99it/s]","\rparsing log, completed traces ::  77%|#######6  | 24213/31509 [00:43<00:10, 666.52it/s]","\rparsing log, completed traces ::  77%|#######7  | 24280/31509 [00:43<00:10, 665.56it/s]","\rparsing log, completed traces ::  77%|#######7  | 24353/31509 [00:43<00:10, 683.98it/s]","\rparsing log, completed traces ::  78%|#######7  | 24422/31509 [00:43<00:10, 657.95it/s]","\rparsing log, completed traces ::  78%|#######7  | 24494/31509 [00:44<00:10, 675.91it/s]","\rparsing log, completed traces ::  78%|#######7  | 24562/31509 [00:44<00:10, 675.29it/s]","\rparsing log, completed traces ::  78%|#######8  | 24639/31509 [00:44<00:09, 701.84it/s]","\rparsing log, completed traces ::  78%|#######8  | 24710/31509 [00:44<00:09, 688.54it/s]","\rparsing log, completed traces ::  79%|#######8  | 24780/31509 [00:44<00:09, 683.95it/s]","\rparsing log, completed traces ::  79%|#######8  | 24850/31509 [00:44<00:09, 688.07it/s]","\rparsing log, completed traces ::  79%|#######9  | 24922/31509 [00:44<00:09, 696.26it/s]","\rparsing log, completed traces ::  79%|#######9  | 24998/31509 [00:44<00:09, 712.23it/s]","\rparsing log, completed traces ::  80%|#######9  | 25070/31509 [00:44<00:09, 674.18it/s]","\rparsing log, completed traces ::  80%|#######9  | 25139/31509 [00:44<00:09, 677.78it/s]","\rparsing log, completed traces ::  80%|########  | 25211/31509 [00:45<00:09, 686.97it/s]","\rparsing log, completed traces ::  80%|########  | 25280/31509 [00:45<00:09, 669.00it/s]","\rparsing log, completed traces ::  80%|########  | 25348/31509 [00:45<00:09, 650.88it/s]","\rparsing log, completed traces ::  81%|########  | 25414/31509 [00:46<00:35, 173.22it/s]","\rparsing log, completed traces ::  81%|########  | 25481/31509 [00:46<00:27, 221.42it/s]","\rparsing log, completed traces ::  81%|########1 | 25548/31509 [00:46<00:21, 276.12it/s]","\rparsing log, completed traces ::  81%|########1 | 25617/31509 [00:46<00:17, 336.46it/s]","\rparsing log, completed traces ::  82%|########1 | 25684/31509 [00:46<00:14, 394.40it/s]","\rparsing log, completed traces ::  82%|########1 | 25753/31509 [00:46<00:12, 451.54it/s]","\rparsing log, completed traces ::  82%|########1 | 25818/31509 [00:46<00:11, 494.86it/s]","\rparsing log, completed traces ::  82%|########2 | 25886/31509 [00:47<00:10, 538.53it/s]","\rparsing log, completed traces ::  82%|########2 | 25953/31509 [00:47<00:09, 570.72it/s]","\rparsing log, completed traces ::  83%|########2 | 26019/31509 [00:47<00:09, 586.21it/s]","\rparsing log, completed traces ::  83%|########2 | 26084/31509 [00:47<00:09, 600.64it/s]","\rparsing log, completed traces ::  83%|########3 | 26154/31509 [00:47<00:08, 625.54it/s]","\rparsing log, completed traces ::  83%|########3 | 26223/31509 [00:47<00:08, 643.63it/s]","\rparsing log, completed traces ::  83%|########3 | 26293/31509 [00:47<00:07, 658.74it/s]","\rparsing log, completed traces ::  84%|########3 | 26364/31509 [00:47<00:07, 670.58it/s]","\rparsing log, completed traces ::  84%|########3 | 26433/31509 [00:47<00:07, 667.97it/s]","\rparsing log, completed traces ::  84%|########4 | 26501/31509 [00:48<00:07, 649.65it/s]","\rparsing log, completed traces ::  84%|########4 | 26567/31509 [00:48<00:07, 649.28it/s]","\rparsing log, completed traces ::  85%|########4 | 26633/31509 [00:48<00:07, 643.42it/s]","\rparsing log, completed traces ::  85%|########4 | 26698/31509 [00:48<00:07, 639.84it/s]","\rparsing log, completed traces ::  85%|########4 | 26769/31509 [00:48<00:07, 659.29it/s]","\rparsing log, completed traces ::  85%|########5 | 26836/31509 [00:48<00:07, 658.85it/s]","\rparsing log, completed traces ::  85%|########5 | 26903/31509 [00:48<00:07, 646.54it/s]","\rparsing log, completed traces ::  86%|########5 | 26968/31509 [00:48<00:07, 645.93it/s]","\rparsing log, completed traces ::  86%|########5 | 27033/31509 [00:48<00:07, 632.07it/s]","\rparsing log, completed traces ::  86%|########6 | 27100/31509 [00:48<00:06, 640.37it/s]","\rparsing log, completed traces ::  86%|########6 | 27171/31509 [00:49<00:06, 659.59it/s]","\rparsing log, completed traces ::  86%|########6 | 27240/31509 [00:49<00:06, 665.66it/s]","\rparsing log, completed traces ::  87%|########6 | 27307/31509 [00:49<00:06, 655.37it/s]","\rparsing log, completed traces ::  87%|########6 | 27373/31509 [00:49<00:06, 654.13it/s]","\rparsing log, completed traces ::  87%|########7 | 27440/31509 [00:49<00:06, 657.72it/s]","\rparsing log, completed traces ::  87%|########7 | 27506/31509 [00:49<00:06, 653.63it/s]","\rparsing log, completed traces ::  88%|########7 | 27576/31509 [00:49<00:05, 666.00it/s]","\rparsing log, completed traces ::  88%|########7 | 27645/31509 [00:49<00:05, 669.35it/s]","\rparsing log, completed traces ::  88%|########7 | 27715/31509 [00:49<00:05, 678.18it/s]","\rparsing log, completed traces ::  88%|########8 | 27786/31509 [00:49<00:05, 687.48it/s]","\rparsing log, completed traces ::  88%|########8 | 27855/31509 [00:50<00:05, 676.88it/s]","\rparsing log, completed traces ::  89%|########8 | 27923/31509 [00:50<00:05, 672.11it/s]","\rparsing log, completed traces ::  89%|########8 | 27991/31509 [00:50<00:05, 657.29it/s]","\rparsing log, completed traces ::  89%|########9 | 28059/31509 [00:50<00:05, 661.36it/s]","\rparsing log, completed traces ::  89%|########9 | 28126/31509 [00:50<00:05, 652.65it/s]","\rparsing log, completed traces ::  89%|########9 | 28192/31509 [00:50<00:05, 650.12it/s]","\rparsing log, completed traces ::  90%|########9 | 28263/31509 [00:50<00:04, 666.25it/s]","\rparsing log, completed traces ::  90%|########9 | 28330/31509 [00:50<00:04, 649.21it/s]","\rparsing log, completed traces ::  90%|######### | 28399/31509 [00:50<00:04, 659.00it/s]","\rparsing log, completed traces ::  90%|######### | 28466/31509 [00:50<00:04, 660.58it/s]","\rparsing log, completed traces ::  91%|######### | 28534/31509 [00:51<00:04, 663.17it/s]","\rparsing log, completed traces ::  91%|######### | 28606/31509 [00:51<00:04, 678.94it/s]","\rparsing log, completed traces ::  91%|#########1| 28674/31509 [00:51<00:04, 669.23it/s]","\rparsing log, completed traces ::  91%|#########1| 28741/31509 [00:51<00:04, 635.08it/s]","\rparsing log, completed traces ::  91%|#########1| 28805/31509 [00:51<00:04, 630.65it/s]","\rparsing log, completed traces ::  92%|#########1| 28869/31509 [00:51<00:04, 619.28it/s]","\rparsing log, completed traces ::  92%|#########1| 28933/31509 [00:51<00:04, 624.55it/s]","\rparsing log, completed traces ::  92%|#########2| 29003/31509 [00:51<00:03, 644.12it/s]","\rparsing log, completed traces ::  92%|#########2| 29068/31509 [00:51<00:03, 628.12it/s]","\rparsing log, completed traces ::  92%|#########2| 29133/31509 [00:52<00:03, 631.26it/s]","\rparsing log, completed traces ::  93%|#########2| 29202/31509 [00:52<00:03, 646.47it/s]","\rparsing log, completed traces ::  93%|#########2| 29268/31509 [00:52<00:03, 645.22it/s]","\rparsing log, completed traces ::  93%|#########3| 29334/31509 [00:52<00:03, 645.96it/s]","\rparsing log, completed traces ::  93%|#########3| 29399/31509 [00:52<00:03, 631.32it/s]","\rparsing log, completed traces ::  94%|#########3| 29463/31509 [00:52<00:03, 622.42it/s]","\rparsing log, completed traces ::  94%|#########3| 29526/31509 [00:53<00:13, 148.38it/s]","\rparsing log, completed traces ::  94%|#########3| 29589/31509 [00:53<00:10, 191.31it/s]","\rparsing log, completed traces ::  94%|#########4| 29659/31509 [00:53<00:07, 248.88it/s]","\rparsing log, completed traces ::  94%|#########4| 29726/31509 [00:54<00:05, 306.35it/s]","\rparsing log, completed traces ::  95%|#########4| 29787/31509 [00:54<00:04, 356.54it/s]","\rparsing log, completed traces ::  95%|#########4| 29851/31509 [00:54<00:04, 409.59it/s]","\rparsing log, completed traces ::  95%|#########4| 29917/31509 [00:54<00:03, 462.75it/s]","\rparsing log, completed traces ::  95%|#########5| 29984/31509 [00:54<00:02, 510.34it/s]","\rparsing log, completed traces ::  95%|#########5| 30048/31509 [00:54<00:02, 539.88it/s]","\rparsing log, completed traces ::  96%|#########5| 30115/31509 [00:54<00:02, 572.85it/s]","\rparsing log, completed traces ::  96%|#########5| 30180/31509 [00:54<00:02, 592.33it/s]","\rparsing log, completed traces ::  96%|#########6| 30249/31509 [00:54<00:02, 617.27it/s]","\rparsing log, completed traces ::  96%|#########6| 30315/31509 [00:54<00:01, 626.50it/s]","\rparsing log, completed traces ::  96%|#########6| 30383/31509 [00:55<00:01, 641.52it/s]","\rparsing log, completed traces ::  97%|#########6| 30450/31509 [00:55<00:01, 642.61it/s]","\rparsing log, completed traces ::  97%|#########6| 30516/31509 [00:55<00:01, 645.39it/s]","\rparsing log, completed traces ::  97%|#########7| 30591/31509 [00:55<00:01, 672.72it/s]","\rparsing log, completed traces ::  97%|#########7| 30659/31509 [00:55<00:01, 665.82it/s]","\rparsing log, completed traces ::  98%|#########7| 30727/31509 [00:55<00:01, 663.87it/s]","\rparsing log, completed traces ::  98%|#########7| 30794/31509 [00:55<00:01, 662.79it/s]","\rparsing log, completed traces ::  98%|#########7| 30862/31509 [00:55<00:00, 667.58it/s]","\rparsing log, completed traces ::  98%|#########8| 30929/31509 [00:55<00:00, 660.06it/s]","\rparsing log, completed traces ::  98%|#########8| 30997/31509 [00:56<00:00, 664.67it/s]","\rparsing log, completed traces ::  99%|#########8| 31065/31509 [00:56<00:00, 667.16it/s]","\rparsing log, completed traces ::  99%|#########8| 31137/31509 [00:56<00:00, 678.61it/s]","\rparsing log, completed traces ::  99%|#########9| 31210/31509 [00:56<00:00, 693.46it/s]","\rparsing log, completed traces ::  99%|#########9| 31280/31509 [00:56<00:00, 646.20it/s]","\rparsing log, completed traces ::  99%|#########9| 31346/31509 [00:56<00:00, 637.48it/s]","\rparsing log, completed traces :: 100%|#########9| 31414/31509 [00:56<00:00, 647.92it/s]","\rparsing log, completed traces :: 100%|#########9| 31480/31509 [00:56<00:00, 644.77it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:56<00:00, 554.81it/s]","\n","[data] Loaded BPI2017: events=1202267, cases=31509","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 668/150370 [00:00<00:22, 6649.99it/s]","\rparsing log, completed traces ::   1%|          | 1438/150370 [00:00<00:20, 7237.10it/s]","\rparsing log, completed traces ::   1%|1         | 2196/150370 [00:00<00:20, 7392.91it/s]","\rparsing log, completed traces ::   2%|1         | 2954/150370 [00:00<00:19, 7464.53it/s]","\rparsing log, completed traces ::   2%|2         | 3701/150370 [00:00<00:19, 7431.62it/s]","\rparsing log, completed traces ::   3%|2         | 4452/150370 [00:00<00:19, 7457.92it/s]","\rparsing log, completed traces ::   3%|3         | 5202/150370 [00:00<00:19, 7447.83it/s]","\rparsing log, completed traces ::   4%|3         | 5958/150370 [00:00<00:19, 7481.28it/s]","\rparsing log, completed traces ::   4%|4         | 6707/150370 [00:00<00:19, 7470.97it/s]","\rparsing log, completed traces ::   5%|4         | 7455/150370 [00:01<00:36, 3950.96it/s]","\rparsing log, completed traces ::   5%|5         | 8243/150370 [00:01<00:30, 4691.63it/s]","\rparsing log, completed traces ::   6%|6         | 9047/150370 [00:01<00:26, 5391.97it/s]","\rparsing log, completed traces ::   7%|6         | 9826/150370 [00:01<00:23, 5947.37it/s]","\rparsing log, completed traces ::   7%|7         | 10590/150370 [00:01<00:21, 6368.11it/s]","\rparsing log, completed traces ::   8%|7         | 11320/150370 [00:01<00:21, 6603.36it/s]","\rparsing log, completed traces ::   8%|8         | 12071/150370 [00:01<00:20, 6849.76it/s]","\rparsing log, completed traces ::   9%|8         | 12807/150370 [00:01<00:19, 6992.29it/s]","\rparsing log, completed traces ::   9%|9         | 13565/150370 [00:02<00:19, 7158.38it/s]","\rparsing log, completed traces ::  10%|9         | 14308/150370 [00:02<00:18, 7232.27it/s]","\rparsing log, completed traces ::  10%|#         | 15089/150370 [00:02<00:18, 7400.58it/s]","\rparsing log, completed traces ::  11%|#         | 15875/150370 [00:02<00:17, 7507.05it/s]","\rparsing log, completed traces ::  11%|#1        | 16679/150370 [00:02<00:17, 7664.10it/s]","\rparsing log, completed traces ::  12%|#1        | 17474/150370 [00:02<00:17, 7747.61it/s]","\rparsing log, completed traces ::  12%|#2        | 18254/150370 [00:02<00:17, 7732.44it/s]","\rparsing log, completed traces ::  13%|#2        | 19031/150370 [00:03<00:33, 3884.03it/s]","\rparsing log, completed traces ::  13%|#3        | 19790/150370 [00:03<00:28, 4534.41it/s]","\rparsing log, completed traces ::  14%|#3        | 20564/150370 [00:03<00:25, 5176.70it/s]","\rparsing log, completed traces ::  14%|#4        | 21384/150370 [00:03<00:22, 5849.76it/s]","\rparsing log, completed traces ::  15%|#4        | 22201/150370 [00:03<00:19, 6409.58it/s]","\rparsing log, completed traces ::  15%|#5        | 23022/150370 [00:03<00:18, 6870.45it/s]","\rparsing log, completed traces ::  16%|#5        | 23799/150370 [00:03<00:17, 7108.17it/s]","\rparsing log, completed traces ::  16%|#6        | 24573/150370 [00:03<00:18, 6779.21it/s]","\rparsing log, completed traces ::  17%|#6        | 25298/150370 [00:03<00:18, 6663.54it/s]","\rparsing log, completed traces ::  17%|#7        | 25997/150370 [00:04<00:18, 6563.06it/s]","\rparsing log, completed traces ::  18%|#7        | 26676/150370 [00:04<00:19, 6435.04it/s]","\rparsing log, completed traces ::  18%|#8        | 27335/150370 [00:04<00:19, 6405.90it/s]","\rparsing log, completed traces ::  19%|#8        | 27987/150370 [00:04<00:19, 6383.26it/s]","\rparsing log, completed traces ::  19%|#9        | 28784/150370 [00:04<00:17, 6833.46it/s]","\rparsing log, completed traces ::  20%|#9        | 29604/150370 [00:04<00:16, 7226.96it/s]","\rparsing log, completed traces ::  20%|##        | 30334/150370 [00:04<00:16, 7196.94it/s]","\rparsing log, completed traces ::  21%|##        | 31059/150370 [00:04<00:16, 7147.62it/s]","\rparsing log, completed traces ::  21%|##1       | 31778/150370 [00:05<00:34, 3393.89it/s]","\rparsing log, completed traces ::  22%|##1       | 32436/150370 [00:05<00:30, 3915.87it/s]","\rparsing log, completed traces ::  22%|##2       | 33091/150370 [00:05<00:26, 4418.93it/s]","\rparsing log, completed traces ::  22%|##2       | 33760/150370 [00:05<00:23, 4905.83it/s]","\rparsing log, completed traces ::  23%|##2       | 34416/150370 [00:05<00:21, 5293.67it/s]","\rparsing log, completed traces ::  23%|##3       | 35069/150370 [00:05<00:20, 5601.96it/s]","\rparsing log, completed traces ::  24%|##3       | 35730/150370 [00:05<00:19, 5866.47it/s]","\rparsing log, completed traces ::  24%|##4       | 36393/150370 [00:05<00:18, 6074.60it/s]","\rparsing log, completed traces ::  25%|##4       | 37060/150370 [00:06<00:18, 6241.54it/s]","\rparsing log, completed traces ::  25%|##5       | 37723/150370 [00:06<00:17, 6340.72it/s]","\rparsing log, completed traces ::  26%|##5       | 38413/150370 [00:06<00:17, 6502.25it/s]","\rparsing log, completed traces ::  26%|##6       | 39110/150370 [00:06<00:16, 6638.79it/s]","\rparsing log, completed traces ::  26%|##6       | 39811/150370 [00:06<00:16, 6746.87it/s]","\rparsing log, completed traces ::  27%|##6       | 40497/150370 [00:06<00:16, 6769.08it/s]","\rparsing log, completed traces ::  27%|##7       | 41218/150370 [00:06<00:15, 6869.44it/s]","\rparsing log, completed traces ::  28%|##7       | 41963/150370 [00:06<00:15, 7022.64it/s]","\rparsing log, completed traces ::  28%|##8       | 42687/150370 [00:06<00:15, 7085.26it/s]","\rparsing log, completed traces ::  29%|##8       | 43408/150370 [00:06<00:15, 7120.64it/s]","\rparsing log, completed traces ::  29%|##9       | 44122/150370 [00:07<00:14, 7099.23it/s]","\rparsing log, completed traces ::  30%|##9       | 44833/150370 [00:07<00:34, 3087.83it/s]","\rparsing log, completed traces ::  30%|###       | 45527/150370 [00:07<00:28, 3689.59it/s]","\rparsing log, completed traces ::  31%|###       | 46212/150370 [00:07<00:24, 4264.96it/s]","\rparsing log, completed traces ::  31%|###1      | 46901/150370 [00:07<00:21, 4804.21it/s]","\rparsing log, completed traces ::  32%|###1      | 47577/150370 [00:08<00:19, 5249.65it/s]","\rparsing log, completed traces ::  32%|###2      | 48301/150370 [00:08<00:17, 5737.36it/s]","\rparsing log, completed traces ::  33%|###2      | 49123/150370 [00:08<00:15, 6381.72it/s]","\rparsing log, completed traces ::  33%|###3      | 49844/150370 [00:08<00:15, 6605.19it/s]","\rparsing log, completed traces ::  34%|###3      | 50562/150370 [00:08<00:14, 6657.91it/s]","\rparsing log, completed traces ::  34%|###4      | 51274/150370 [00:08<00:14, 6787.12it/s]","\rparsing log, completed traces ::  35%|###4      | 51988/150370 [00:08<00:14, 6887.99it/s]","\rparsing log, completed traces ::  35%|###5      | 52698/150370 [00:08<00:14, 6948.33it/s]","\rparsing log, completed traces ::  36%|###5      | 53408/150370 [00:08<00:13, 6985.53it/s]","\rparsing log, completed traces ::  36%|###6      | 54137/150370 [00:08<00:13, 7072.47it/s]","\rparsing log, completed traces ::  37%|###6      | 54928/150370 [00:09<00:13, 7318.56it/s]","\rparsing log, completed traces ::  37%|###7      | 55666/150370 [00:09<00:12, 7322.95it/s]","\rparsing log, completed traces ::  38%|###7      | 56445/150370 [00:09<00:12, 7461.56it/s]","\rparsing log, completed traces ::  38%|###8      | 57212/150370 [00:09<00:12, 7523.07it/s]","\rparsing log, completed traces ::  39%|###8      | 57967/150370 [00:09<00:12, 7517.26it/s]","\rparsing log, completed traces ::  39%|###9      | 58721/150370 [00:09<00:12, 7475.13it/s]","\rparsing log, completed traces ::  40%|###9      | 59470/150370 [00:09<00:12, 7438.54it/s]","\rparsing log, completed traces ::  40%|####      | 60234/150370 [00:09<00:12, 7497.29it/s]","\rparsing log, completed traces ::  41%|####      | 61042/150370 [00:09<00:11, 7663.52it/s]","\rparsing log, completed traces ::  41%|####1     | 61809/150370 [00:10<00:28, 3120.60it/s]","\rparsing log, completed traces ::  42%|####1     | 62598/150370 [00:10<00:22, 3825.90it/s]","\rparsing log, completed traces ::  42%|####2     | 63357/150370 [00:10<00:19, 4480.98it/s]","\rparsing log, completed traces ::  43%|####2     | 64130/150370 [00:10<00:16, 5119.47it/s]","\rparsing log, completed traces ::  43%|####3     | 64892/150370 [00:10<00:15, 5658.80it/s]","\rparsing log, completed traces ::  44%|####3     | 65684/150370 [00:10<00:13, 6200.66it/s]","\rparsing log, completed traces ::  44%|####4     | 66486/150370 [00:11<00:12, 6661.76it/s]","\rparsing log, completed traces ::  45%|####4     | 67260/150370 [00:11<00:11, 6947.98it/s]","\rparsing log, completed traces ::  45%|####5     | 68116/150370 [00:11<00:11, 7392.10it/s]","\rparsing log, completed traces ::  46%|####5     | 68934/150370 [00:11<00:10, 7597.22it/s]","\rparsing log, completed traces ::  46%|####6     | 69731/150370 [00:11<00:10, 7617.94it/s]","\rparsing log, completed traces ::  47%|####6     | 70519/150370 [00:11<00:10, 7632.94it/s]","\rparsing log, completed traces ::  47%|####7     | 71301/150370 [00:11<00:10, 7635.30it/s]","\rparsing log, completed traces ::  48%|####7     | 72078/150370 [00:11<00:10, 7595.68it/s]","\rparsing log, completed traces ::  48%|####8     | 72847/150370 [00:11<00:10, 7597.30it/s]","\rparsing log, completed traces ::  49%|####8     | 73613/150370 [00:11<00:10, 7371.65it/s]","\rparsing log, completed traces ::  49%|####9     | 74407/150370 [00:12<00:10, 7530.17it/s]","\rparsing log, completed traces ::  50%|#####     | 75242/150370 [00:12<00:09, 7756.47it/s]","\rparsing log, completed traces ::  51%|#####     | 76030/150370 [00:12<00:09, 7791.54it/s]","\rparsing log, completed traces ::  51%|#####1    | 76841/150370 [00:12<00:09, 7884.47it/s]","\rparsing log, completed traces ::  52%|#####1    | 77632/150370 [00:12<00:09, 7749.28it/s]","\rparsing log, completed traces ::  52%|#####2    | 78409/150370 [00:12<00:09, 7615.20it/s]","\rparsing log, completed traces ::  53%|#####2    | 79173/150370 [00:12<00:09, 7621.68it/s]","\rparsing log, completed traces ::  53%|#####3    | 79937/150370 [00:12<00:09, 7584.13it/s]","\rparsing log, completed traces ::  54%|#####3    | 80697/150370 [00:12<00:09, 7587.26it/s]","\rparsing log, completed traces ::  54%|#####4    | 81457/150370 [00:12<00:09, 7552.67it/s]","\rparsing log, completed traces ::  55%|#####4    | 82213/150370 [00:13<00:24, 2835.91it/s]","\rparsing log, completed traces ::  55%|#####5    | 83032/150370 [00:13<00:18, 3569.92it/s]","\rparsing log, completed traces ::  56%|#####5    | 83802/150370 [00:13<00:15, 4243.46it/s]","\rparsing log, completed traces ::  56%|#####6    | 84558/150370 [00:13<00:13, 4871.27it/s]","\rparsing log, completed traces ::  57%|#####6    | 85314/150370 [00:14<00:11, 5443.24it/s]","\rparsing log, completed traces ::  57%|#####7    | 86081/150370 [00:14<00:10, 5961.72it/s]","\rparsing log, completed traces ::  58%|#####7    | 86846/150370 [00:14<00:09, 6373.72it/s]","\rparsing log, completed traces ::  58%|#####8    | 87637/150370 [00:14<00:09, 6775.79it/s]","\rparsing log, completed traces ::  59%|#####8    | 88432/150370 [00:14<00:08, 7096.11it/s]","\rparsing log, completed traces ::  59%|#####9    | 89200/150370 [00:14<00:08, 7256.32it/s]","\rparsing log, completed traces ::  60%|#####9    | 90005/150370 [00:14<00:08, 7481.12it/s]","\rparsing log, completed traces ::  60%|######    | 90789/150370 [00:14<00:07, 7583.99it/s]","\rparsing log, completed traces ::  61%|######    | 91571/150370 [00:14<00:07, 7652.79it/s]","\rparsing log, completed traces ::  61%|######1   | 92352/150370 [00:14<00:07, 7662.60it/s]","\rparsing log, completed traces ::  62%|######1   | 93129/150370 [00:15<00:07, 7660.15it/s]","\rparsing log, completed traces ::  62%|######2   | 93903/150370 [00:15<00:07, 7603.53it/s]","\rparsing log, completed traces ::  63%|######2   | 94706/150370 [00:15<00:07, 7729.08it/s]","\rparsing log, completed traces ::  64%|######3   | 95490/150370 [00:15<00:07, 7760.34it/s]","\rparsing log, completed traces ::  64%|######4   | 96269/150370 [00:15<00:07, 7715.74it/s]","\rparsing log, completed traces ::  65%|######4   | 97043/150370 [00:15<00:06, 7666.77it/s]","\rparsing log, completed traces ::  65%|######5   | 97812/150370 [00:15<00:06, 7611.88it/s]","\rparsing log, completed traces ::  66%|######5   | 98578/150370 [00:15<00:06, 7613.09it/s]","\rparsing log, completed traces ::  66%|######6   | 99347/150370 [00:15<00:06, 7635.13it/s]","\rparsing log, completed traces ::  67%|######6   | 100112/150370 [00:15<00:06, 7547.49it/s]","\rparsing log, completed traces ::  67%|######7   | 100888/150370 [00:16<00:06, 7593.25it/s]","\rparsing log, completed traces ::  68%|######7   | 101659/150370 [00:16<00:06, 7626.94it/s]","\rparsing log, completed traces ::  68%|######8   | 102423/150370 [00:16<00:06, 7622.05it/s]","\rparsing log, completed traces ::  69%|######8   | 103186/150370 [00:16<00:06, 7575.09it/s]","\rparsing log, completed traces ::  69%|######9   | 103944/150370 [00:16<00:06, 7552.09it/s]","\rparsing log, completed traces ::  70%|######9   | 104700/150370 [00:16<00:06, 7490.42it/s]","\rparsing log, completed traces ::  70%|#######   | 105450/150370 [00:17<00:17, 2522.73it/s]","\rparsing log, completed traces ::  71%|#######   | 106185/150370 [00:17<00:14, 3124.89it/s]","\rparsing log, completed traces ::  71%|#######1  | 106925/150370 [00:17<00:11, 3771.58it/s]","\rparsing log, completed traces ::  72%|#######1  | 107659/150370 [00:17<00:09, 4405.38it/s]","\rparsing log, completed traces ::  72%|#######2  | 108390/150370 [00:17<00:08, 4992.53it/s]","\rparsing log, completed traces ::  73%|#######2  | 109117/150370 [00:17<00:07, 5503.06it/s]","\rparsing log, completed traces ::  73%|#######3  | 109857/150370 [00:17<00:06, 5962.61it/s]","\rparsing log, completed traces ::  74%|#######3  | 110594/150370 [00:18<00:06, 6323.43it/s]","\rparsing log, completed traces ::  74%|#######4  | 111324/150370 [00:18<00:05, 6584.32it/s]","\rparsing log, completed traces ::  75%|#######4  | 112077/150370 [00:18<00:05, 6833.08it/s]","\rparsing log, completed traces ::  75%|#######5  | 112808/150370 [00:18<00:05, 6928.35it/s]","\rparsing log, completed traces ::  76%|#######5  | 113568/150370 [00:18<00:05, 7120.41it/s]","\rparsing log, completed traces ::  76%|#######6  | 114447/150370 [00:18<00:04, 7594.87it/s]","\rparsing log, completed traces ::  77%|#######6  | 115368/150370 [00:18<00:04, 8067.93it/s]","\rparsing log, completed traces ::  77%|#######7  | 116260/150370 [00:18<00:04, 8318.19it/s]","\rparsing log, completed traces ::  78%|#######8  | 117291/150370 [00:18<00:03, 8907.17it/s]","\rparsing log, completed traces ::  79%|#######8  | 118190/150370 [00:18<00:03, 8256.08it/s]","\rparsing log, completed traces ::  79%|#######9  | 119031/150370 [00:19<00:04, 7825.86it/s]","\rparsing log, completed traces ::  80%|#######9  | 119828/150370 [00:19<00:04, 7527.50it/s]","\rparsing log, completed traces ::  80%|########  | 120591/150370 [00:19<00:04, 7361.10it/s]","\rparsing log, completed traces ::  81%|########  | 121334/150370 [00:19<00:04, 7226.82it/s]","\rparsing log, completed traces ::  81%|########1 | 122061/150370 [00:19<00:03, 7107.96it/s]","\rparsing log, completed traces ::  82%|########1 | 122775/150370 [00:19<00:03, 7073.31it/s]","\rparsing log, completed traces ::  82%|########2 | 123484/150370 [00:19<00:03, 7057.65it/s]","\rparsing log, completed traces ::  83%|########2 | 124191/150370 [00:19<00:03, 6995.92it/s]","\rparsing log, completed traces ::  83%|########3 | 124892/150370 [00:19<00:03, 6989.00it/s]","\rparsing log, completed traces ::  84%|########3 | 125607/150370 [00:20<00:03, 7035.26it/s]","\rparsing log, completed traces ::  84%|########4 | 126320/150370 [00:20<00:03, 7039.86it/s]","\rparsing log, completed traces ::  84%|########4 | 127061/150370 [00:20<00:03, 7148.88it/s]","\rparsing log, completed traces ::  85%|########4 | 127777/150370 [00:20<00:03, 7130.05it/s]","\rparsing log, completed traces ::  85%|########5 | 128491/150370 [00:20<00:03, 7115.80it/s]","\rparsing log, completed traces ::  86%|########5 | 129226/150370 [00:20<00:02, 7170.44it/s]","\rparsing log, completed traces ::  86%|########6 | 129946/150370 [00:20<00:02, 7177.13it/s]","\rparsing log, completed traces ::  87%|########6 | 130664/150370 [00:20<00:02, 7142.34it/s]","\rparsing log, completed traces ::  87%|########7 | 131379/150370 [00:21<00:08, 2219.79it/s]","\rparsing log, completed traces ::  88%|########7 | 132211/150370 [00:21<00:06, 2931.86it/s]","\rparsing log, completed traces ::  88%|########8 | 133000/150370 [00:21<00:04, 3637.66it/s]","\rparsing log, completed traces ::  89%|########8 | 133763/150370 [00:21<00:03, 4313.81it/s]","\rparsing log, completed traces ::  89%|########9 | 134477/150370 [00:21<00:03, 4864.11it/s]","\rparsing log, completed traces ::  90%|########9 | 135207/150370 [00:22<00:02, 5394.31it/s]","\rparsing log, completed traces ::  90%|######### | 135917/150370 [00:22<00:02, 5779.25it/s]","\rparsing log, completed traces ::  91%|######### | 136632/150370 [00:22<00:02, 6120.88it/s]","\rparsing log, completed traces ::  91%|#########1| 137341/150370 [00:22<00:02, 6338.21it/s]","\rparsing log, completed traces ::  92%|#########1| 138060/150370 [00:22<00:01, 6570.23it/s]","\rparsing log, completed traces ::  92%|#########2| 138773/150370 [00:22<00:01, 6727.02it/s]","\rparsing log, completed traces ::  93%|#########2| 139494/150370 [00:22<00:01, 6842.10it/s]","\rparsing log, completed traces ::  93%|#########3| 140230/150370 [00:22<00:01, 6991.74it/s]","\rparsing log, completed traces ::  94%|#########3| 140961/150370 [00:22<00:01, 7083.83it/s]","\rparsing log, completed traces ::  94%|#########4| 141707/150370 [00:22<00:01, 7193.48it/s]","\rparsing log, completed traces ::  95%|#########4| 142442/150370 [00:23<00:01, 7239.32it/s]","\rparsing log, completed traces ::  95%|#########5| 143173/150370 [00:23<00:00, 7216.83it/s]","\rparsing log, completed traces ::  96%|#########5| 143909/150370 [00:23<00:00, 7258.33it/s]","\rparsing log, completed traces ::  96%|#########6| 144649/150370 [00:23<00:00, 7299.39it/s]","\rparsing log, completed traces ::  97%|#########6| 145382/150370 [00:23<00:00, 6941.61it/s]","\rparsing log, completed traces ::  97%|#########7| 146082/150370 [00:23<00:00, 6569.50it/s]","\rparsing log, completed traces ::  98%|#########7| 146746/150370 [00:23<00:00, 6364.34it/s]","\rparsing log, completed traces ::  98%|#########8| 147388/150370 [00:23<00:00, 6168.60it/s]","\rparsing log, completed traces ::  98%|#########8| 148009/150370 [00:23<00:00, 6063.37it/s]","\rparsing log, completed traces ::  99%|#########8| 148618/150370 [00:24<00:00, 6068.90it/s]","\rparsing log, completed traces ::  99%|#########9| 149260/150370 [00:24<00:00, 6167.38it/s]","\rparsing log, completed traces :: 100%|#########9| 149944/150370 [00:24<00:00, 6361.40it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:24<00:00, 6182.05it/s]","\n","[data] Loaded ROAD: events=561470, cases=150370","\n","\n=== Dataset: BPI2012 ===","\n","Samples train/val/test: 29636/5381/5419; vocab=23","\n","Epoch 1: validation_loss = 1.0980 | acc=0.7095 | f1=0.3282 | top3=0.9262 | ece=0.1770","\n","Epoch 2: validation_loss = 0.7539 | acc=0.7378 | f1=0.3896 | top3=0.9582 | ece=0.0706","\n","Epoch 3: validation_loss = 0.6663 | acc=0.7478 | f1=0.4131 | top3=0.9682 | ece=0.0452","\n","Epoch 4: validation_loss = 0.6261 | acc=0.7558 | f1=0.4474 | top3=0.9718 | ece=0.0311","\n","Epoch 5: validation_loss = 0.6077 | acc=0.7571 | f1=0.4619 | top3=0.9725 | ece=0.0290","\n","Epoch 6: validation_loss = 0.5936 | acc=0.7614 | f1=0.5000 | top3=0.9755 | ece=0.0297","\n","Epoch 7: validation_loss = 0.5856 | acc=0.7616 | f1=0.4991 | top3=0.9768 | ece=0.0323","\n","Epoch 8: validation_loss = 0.5786 | acc=0.7632 | f1=0.5133 | top3=0.9781 | ece=0.0285","\n","Epoch 9: validation_loss = 0.5752 | acc=0.7647 | f1=0.5106 | top3=0.9781 | ece=0.0379","\n","Epoch 10: validation_loss = 0.5664 | acc=0.7664 | f1=0.5206 | top3=0.9777 | ece=0.0304","\n","Epoch 11: validation_loss = 0.5636 | acc=0.7645 | f1=0.5118 | top3=0.9777 | ece=0.0289","\n","Epoch 12: validation_loss = 0.5643 | acc=0.7649 | f1=0.5188 | top3=0.9783 | ece=0.0237","\n","Epoch 13: validation_loss = 0.5586 | acc=0.7688 | f1=0.5517 | top3=0.9779 | ece=0.0321","\n","Epoch 14: validation_loss = 0.5570 | acc=0.7670 | f1=0.5546 | top3=0.9786 | ece=0.0283","\n","Epoch 15: validation_loss = 0.5549 | acc=0.7690 | f1=0.5572 | top3=0.9786 | ece=0.0291","\n","Epoch 16: validation_loss = 0.5562 | acc=0.7671 | f1=0.5789 | top3=0.9790 | ece=0.0307","\n","Epoch 17: validation_loss = 0.5496 | acc=0.7696 | f1=0.5851 | top3=0.9790 | ece=0.0146","\n","Epoch 18: validation_loss = 0.5517 | acc=0.7673 | f1=0.5810 | top3=0.9792 | ece=0.0243","\n","Epoch 19: validation_loss = 0.5471 | acc=0.7679 | f1=0.5801 | top3=0.9781 | ece=0.0241","\n","Epoch 20: validation_loss = 0.5517 | acc=0.7675 | f1=0.5815 | top3=0.9786 | ece=0.0279","\n","Epoch 21: validation_loss = 0.5494 | acc=0.7686 | f1=0.5883 | top3=0.9788 | ece=0.0232","\n","Epoch 22: validation_loss = 0.5485 | acc=0.7727 | f1=0.5913 | top3=0.9788 | ece=0.0232","\n","Epoch 23: validation_loss = 0.5431 | acc=0.7722 | f1=0.5940 | top3=0.9784 | ece=0.0158","\n","Epoch 24: validation_loss = 0.5473 | acc=0.7701 | f1=0.5888 | top3=0.9783 | ece=0.0275","\n","Epoch 25: validation_loss = 0.5463 | acc=0.7696 | f1=0.5912 | top3=0.9790 | ece=0.0250","\n","Epoch 26: validation_loss = 0.5454 | acc=0.7710 | f1=0.5991 | top3=0.9790 | ece=0.0236","\n","Early stopping (no improvement in 8 epochs).","\n","[BPI2012] Train: loss=0.5508 acc=0.7801 f1=0.6015 top3=0.9777 ece=0.0151","\n","[BPI2012] Val:   loss=0.5517 acc=0.7673 f1=0.5810 top3=0.9792 ece=0.0243","\n","[BPI2012] Test:  loss=0.5593 acc=0.7643 f1=0.5735 top3=0.9815 ece=0.0199","\n","\n=== Dataset: BPI2017 ===","\n","Samples train/val/test: 44965/9464/9455; vocab=24","\n","Epoch 1: validation_loss = 0.7534 | acc=0.7936 | f1=0.5117 | top3=0.9587 | ece=0.1476","\n","Epoch 2: validation_loss = 0.5340 | acc=0.8087 | f1=0.5679 | top3=0.9741 | ece=0.0458","\n","Epoch 3: validation_loss = 0.4883 | acc=0.8146 | f1=0.5711 | top3=0.9790 | ece=0.0303","\n","Epoch 4: validation_loss = 0.4673 | acc=0.8165 | f1=0.5727 | top3=0.9802 | ece=0.0196","\n","Epoch 5: validation_loss = 0.4580 | acc=0.8167 | f1=0.5752 | top3=0.9805 | ece=0.0191","\n","Epoch 6: validation_loss = 0.4524 | acc=0.8152 | f1=0.5867 | top3=0.9805 | ece=0.0221","\n","Epoch 7: validation_loss = 0.4476 | acc=0.8150 | f1=0.5935 | top3=0.9802 | ece=0.0192","\n","Epoch 8: validation_loss = 0.4435 | acc=0.8175 | f1=0.5955 | top3=0.9801 | ece=0.0169","\n","Epoch 9: validation_loss = 0.4398 | acc=0.8197 | f1=0.5978 | top3=0.9800 | ece=0.0125","\n","Epoch 10: validation_loss = 0.4396 | acc=0.8157 | f1=0.5928 | top3=0.9808 | ece=0.0227","\n","Epoch 11: validation_loss = 0.4345 | acc=0.8184 | f1=0.5981 | top3=0.9805 | ece=0.0101","\n","Epoch 12: validation_loss = 0.4359 | acc=0.8166 | f1=0.5920 | top3=0.9810 | ece=0.0199","\n","Epoch 13: validation_loss = 0.4335 | acc=0.8172 | f1=0.5984 | top3=0.9808 | ece=0.0111","\n","Epoch 14: validation_loss = 0.4337 | acc=0.8138 | f1=0.5937 | top3=0.9809 | ece=0.0137","\n","Epoch 15: validation_loss = 0.4298 | acc=0.8189 | f1=0.5980 | top3=0.9815 | ece=0.0102","\n","Epoch 16: validation_loss = 0.4324 | acc=0.8177 | f1=0.5950 | top3=0.9815 | ece=0.0114","\n","Epoch 17: validation_loss = 0.4317 | acc=0.8142 | f1=0.5977 | top3=0.9814 | ece=0.0157","\n","Epoch 18: validation_loss = 0.4303 | acc=0.8183 | f1=0.5968 | top3=0.9817 | ece=0.0114","\n","Epoch 19: validation_loss = 0.4308 | acc=0.8173 | f1=0.5974 | top3=0.9813 | ece=0.0132","\n","Epoch 20: validation_loss = 0.4280 | acc=0.8169 | f1=0.5958 | top3=0.9809 | ece=0.0136","\n","Epoch 21: validation_loss = 0.4298 | acc=0.8179 | f1=0.6095 | top3=0.9809 | ece=0.0125","\n","Epoch 22: validation_loss = 0.4253 | acc=0.8183 | f1=0.6116 | top3=0.9820 | ece=0.0138","\n","Epoch 23: validation_loss = 0.4300 | acc=0.8131 | f1=0.6031 | top3=0.9821 | ece=0.0152","\n","Epoch 24: validation_loss = 0.4273 | acc=0.8180 | f1=0.6112 | top3=0.9817 | ece=0.0120","\n","Epoch 25: validation_loss = 0.4247 | acc=0.8179 | f1=0.6191 | top3=0.9820 | ece=0.0074","\n","Epoch 26: validation_loss = 0.4261 | acc=0.8192 | f1=0.6304 | top3=0.9821 | ece=0.0118","\n","Epoch 27: validation_loss = 0.4242 | acc=0.8204 | f1=0.6294 | top3=0.9825 | ece=0.0099","\n","Epoch 28: validation_loss = 0.4270 | acc=0.8175 | f1=0.6108 | top3=0.9813 | ece=0.0124","\n","Epoch 29: validation_loss = 0.4261 | acc=0.8192 | f1=0.6282 | top3=0.9819 | ece=0.0154","\n","Epoch 30: validation_loss = 0.4280 | acc=0.8175 | f1=0.6132 | top3=0.9820 | ece=0.0108","\n","Epoch 31: validation_loss = 0.4224 | acc=0.8183 | f1=0.6279 | top3=0.9827 | ece=0.0075","\n","Epoch 32: validation_loss = 0.4257 | acc=0.8190 | f1=0.6272 | top3=0.9827 | ece=0.0092","\n","Epoch 33: validation_loss = 0.4215 | acc=0.8186 | f1=0.6301 | top3=0.9825 | ece=0.0090","\n","Epoch 34: validation_loss = 0.4235 | acc=0.8202 | f1=0.6127 | top3=0.9824 | ece=0.0108","\n","Epoch 35: validation_loss = 0.4215 | acc=0.8202 | f1=0.6309 | top3=0.9826 | ece=0.0095","\n","Epoch 36: validation_loss = 0.4213 | acc=0.8182 | f1=0.6288 | top3=0.9829 | ece=0.0089","\n","Epoch 37: validation_loss = 0.4205 | acc=0.8197 | f1=0.6284 | top3=0.9831 | ece=0.0072","\n","Epoch 38: validation_loss = 0.4224 | acc=0.8182 | f1=0.6264 | top3=0.9832 | ece=0.0103","\n","Epoch 39: validation_loss = 0.4234 | acc=0.8226 | f1=0.6334 | top3=0.9822 | ece=0.0125","\n","Epoch 40: validation_loss = 0.4214 | acc=0.8210 | f1=0.6310 | top3=0.9833 | ece=0.0075","\n","[BPI2017] Train: loss=0.4124 acc=0.8256 f1=0.6478 top3=0.9848 ece=0.0058","\n","[BPI2017] Val:   loss=0.4214 acc=0.8210 f1=0.6310 top3=0.9833 ece=0.0075","\n","[BPI2017] Test:  loss=0.4248 acc=0.8287 f1=0.6309 top3=0.9846 ece=0.0114","\n","\n=== Dataset: ROAD ===","\n","Samples train/val/test: 12067/2555/2709; vocab=11","\n","Epoch 1: validation_loss = 1.2671 | acc=0.8423 | f1=0.4058 | top3=0.9523 | ece=0.4908","\n","Epoch 2: validation_loss = 0.5801 | acc=0.8286 | f1=0.4147 | top3=0.9796 | ece=0.1001","\n","Epoch 3: validation_loss = 0.5009 | acc=0.8614 | f1=0.4450 | top3=0.9796 | ece=0.0464","\n","Epoch 4: validation_loss = 0.4707 | acc=0.8614 | f1=0.4449 | top3=0.9824 | ece=0.0234","\n","Epoch 5: validation_loss = 0.4494 | acc=0.8642 | f1=0.4461 | top3=0.9867 | ece=0.0238","\n","Epoch 6: validation_loss = 0.4373 | acc=0.8646 | f1=0.4448 | top3=0.9937 | ece=0.0186","\n","Epoch 7: validation_loss = 0.4278 | acc=0.8646 | f1=0.4449 | top3=0.9937 | ece=0.0167","\n","Epoch 8: validation_loss = 0.4189 | acc=0.8665 | f1=0.4937 | top3=0.9941 | ece=0.0139","\n","Epoch 9: validation_loss = 0.4145 | acc=0.8701 | f1=0.6039 | top3=0.9945 | ece=0.0176","\n","Epoch 10: validation_loss = 0.4118 | acc=0.8720 | f1=0.6543 | top3=0.9969 | ece=0.0245","\n","Epoch 11: validation_loss = 0.4051 | acc=0.8720 | f1=0.6543 | top3=0.9977 | ece=0.0163","\n","Epoch 12: validation_loss = 0.4021 | acc=0.8748 | f1=0.7374 | top3=0.9977 | ece=0.0189","\n","Epoch 13: validation_loss = 0.3998 | acc=0.8748 | f1=0.7374 | top3=0.9996 | ece=0.0201","\n","Epoch 14: validation_loss = 0.3972 | acc=0.8751 | f1=0.7468 | top3=0.9996 | ece=0.0224","\n","Epoch 15: validation_loss = 0.3974 | acc=0.8740 | f1=0.7412 | top3=0.9996 | ece=0.0293","\n","Epoch 16: validation_loss = 0.3918 | acc=0.8751 | f1=0.7468 | top3=0.9996 | ece=0.0151","\n","Epoch 17: validation_loss = 0.3910 | acc=0.8751 | f1=0.7468 | top3=0.9996 | ece=0.0142","\n","Epoch 18: validation_loss = 0.3895 | acc=0.8755 | f1=0.7522 | top3=0.9996 | ece=0.0231","\n","Epoch 19: validation_loss = 0.3889 | acc=0.8767 | f1=0.7696 | top3=0.9996 | ece=0.0183","\n","Epoch 20: validation_loss = 0.3858 | acc=0.8755 | f1=0.7522 | top3=0.9996 | ece=0.0107","\n","Epoch 21: validation_loss = 0.3868 | acc=0.8755 | f1=0.7522 | top3=0.9996 | ece=0.0174","\n","Early stopping (no improvement in 8 epochs).","\n","[ROAD] Train: loss=0.3724 acc=0.8793 f1=0.6480 top3=0.9992 ece=0.0114","\n","[ROAD] Val:   loss=0.3998 acc=0.8748 f1=0.7374 top3=0.9996 ece=0.0201","\n","[ROAD] Test:  loss=0.3549 acc=0.8955 f1=0.7190 top3=0.9993 ece=0.0206","\n","Execution time: 6 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the consolidated experiment_data.npy from the working directory, parse its nested structure according to the original training code, and extract final metrics for train, validation, and test for each dataset. For clarity, I will print the dataset name first, followed by clearly labeled metrics like \"train accuracy\" and \"validation loss.\" I will also print auxiliary information such as epochs trained and best validation top-3 accuracy. The script executes immediately without any special entry point and avoids creating any plots.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.exists(path):\n        print(f\"experiment_data.npy not found at: {path}\")\n        return {}\n    try:\n        data = np.load(path, allow_pickle=True).item()\n        if not isinstance(data, dict):\n            print(\"Loaded experiment data is not a dictionary. Printing raw content:\")\n            print(data)\n            return {}\n        return data\n    except Exception as e:\n        print(f\"Failed to load experiment data: {e}\")\n        return {}\n\n\ndef extract_final_metrics(result_dict, split_key):\n    # result_dict[\"metrics\"][split_key] is a list of tuples: (label, metrics_dict)\n    # We want the entry labeled \"final\" if present; else, fallback to last entry\n    try:\n        entries = result_dict.get(\"metrics\", {}).get(split_key, [])\n        final_entry = None\n        for label, metrics in entries:\n            if label == \"final\":\n                final_entry = metrics\n                break\n        if final_entry is None and len(entries) > 0:\n            final_entry = entries[-1][1]\n        return final_entry if isinstance(final_entry, dict) else {}\n    except Exception:\n        return {}\n\n\ndef print_dataset_metrics(name, res):\n    print(f\"Dataset: {name}\")\n\n    train_metrics = extract_final_metrics(res, \"train\")\n    val_metrics = extract_final_metrics(res, \"val\")\n    test_metrics = extract_final_metrics(res, \"test\")\n\n    # Helper to safely format numbers\n    def fmt(v):\n        try:\n            if isinstance(v, (float, int, np.floating, np.integer)):\n                return f\"{float(v):.6f}\"\n            return str(v)\n        except Exception:\n            return str(v)\n\n    # Train metrics\n    if train_metrics:\n        if \"loss\" in train_metrics:\n            print(f\"train loss: {fmt(train_metrics.get('loss'))}\")\n        if \"acc\" in train_metrics:\n            print(f\"train accuracy: {fmt(train_metrics.get('acc'))}\")\n        if \"macro_f1\" in train_metrics:\n            print(f\"train F1 score (macro): {fmt(train_metrics.get('macro_f1'))}\")\n        if \"top3\" in train_metrics:\n            print(f\"train top-3 accuracy: {fmt(train_metrics.get('top3'))}\")\n        if \"ece\" in train_metrics:\n            print(f\"train ECE: {fmt(train_metrics.get('ece'))}\")\n\n    # Validation metrics\n    if val_metrics:\n        if \"loss\" in val_metrics:\n            print(f\"validation loss: {fmt(val_metrics.get('loss'))}\")\n        if \"acc\" in val_metrics:\n            print(f\"validation accuracy: {fmt(val_metrics.get('acc'))}\")\n        if \"macro_f1\" in val_metrics:\n            print(f\"validation F1 score (macro): {fmt(val_metrics.get('macro_f1'))}\")\n        if \"top3\" in val_metrics:\n            print(f\"validation top-3 accuracy: {fmt(val_metrics.get('top3'))}\")\n        if \"ece\" in val_metrics:\n            print(f\"validation ECE: {fmt(val_metrics.get('ece'))}\")\n\n    # Test metrics\n    if test_metrics:\n        if \"loss\" in test_metrics:\n            print(f\"test loss: {fmt(test_metrics.get('loss'))}\")\n        if \"acc\" in test_metrics:\n            print(f\"test accuracy: {fmt(test_metrics.get('acc'))}\")\n        if \"macro_f1\" in test_metrics:\n            print(f\"test F1 score (macro): {fmt(test_metrics.get('macro_f1'))}\")\n        if \"top3\" in test_metrics:\n            print(f\"test top-3 accuracy: {fmt(test_metrics.get('top3'))}\")\n        if \"ece\" in test_metrics:\n            print(f\"test ECE: {fmt(test_metrics.get('ece'))}\")\n\n    # Additional summary info\n    if \"epochs_trained\" in res:\n        print(f\"epochs trained: {fmt(res.get('epochs_trained'))}\")\n    if \"best_val_top3\" in res:\n        print(f\"best validation top-3 accuracy: {fmt(res.get('best_val_top3'))}\")\n    if \"best_epoch\" in res:\n        print(f\"best epoch: {fmt(res.get('best_epoch'))}\")\n\n\ndef main():\n    experiment_data = load_experiment_data()\n    if not experiment_data:\n        print(\"No datasets available in experiment data.\")\n    else:\n        for dataset_name, results in experiment_data.items():\n            try:\n                print_dataset_metrics(dataset_name, results)\n            except Exception as e:\n                print(f\"Failed to process dataset '{dataset_name}': {e}\")\n\n\n# Execute immediately\nmain()\n","parse_term_out":["Dataset: BPI2012","\n","train loss: 0.550781","\n","train accuracy: 0.780099","\n","train F1 score (macro): 0.601468","\n","train top-3 accuracy: 0.977730","\n","train ECE: 0.015108","\n","validation loss: 0.551736","\n","validation accuracy: 0.767329","\n","validation F1 score (macro): 0.581032","\n","validation top-3 accuracy: 0.979186","\n","validation ECE: 0.024318","\n","test loss: 0.559347","\n","test accuracy: 0.764348","\n","test F1 score (macro): 0.573526","\n","test top-3 accuracy: 0.981546","\n","test ECE: 0.019878","\n","epochs trained: 26.000000","\n","best validation top-3 accuracy: 0.979186","\n","best epoch: 18.000000","\n","Dataset: BPI2017","\n","train loss: 0.412368","\n","train accuracy: 0.825575","\n","train F1 score (macro): 0.647785","\n","train top-3 accuracy: 0.984833","\n","train ECE: 0.005811","\n","validation loss: 0.421440","\n","validation accuracy: 0.821006","\n","validation F1 score (macro): 0.631031","\n","validation top-3 accuracy: 0.983305","\n","validation ECE: 0.007509","\n","test loss: 0.424809","\n","test accuracy: 0.828662","\n","test F1 score (macro): 0.630893","\n","test top-3 accuracy: 0.984558","\n","test ECE: 0.011444","\n","epochs trained: 40.000000","\n","best validation top-3 accuracy: 0.983305","\n","best epoch: 40.000000","\n","Dataset: ROAD","\n","train loss: 0.372388","\n","train accuracy: 0.879257","\n","train F1 score (macro): 0.647995","\n","train top-3 accuracy: 0.999171","\n","train ECE: 0.011372","\n","validation loss: 0.399839","\n","validation accuracy: 0.874755","\n","validation F1 score (macro): 0.737367","\n","validation top-3 accuracy: 0.999609","\n","validation ECE: 0.020124","\n","test loss: 0.354950","\n","test accuracy: 0.895533","\n","test F1 score (macro): 0.719046","\n","test top-3 accuracy: 0.999262","\n","test ECE: 0.020564","\n","epochs trained: 21.000000","\n","best validation top-3 accuracy: 0.999609","\n","best epoch: 13.000000","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":413.9843521118164,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"","exp_results_dir":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839","metric":{"value":{"metric_names":[{"metric_name":"train loss","lower_is_better":true,"description":"Final training loss after the last epoch.","data":[{"dataset_name":"BPI2012","final_value":0.550781,"best_value":0.550781},{"dataset_name":"BPI2017","final_value":0.412368,"best_value":0.412368},{"dataset_name":"ROAD","final_value":0.372388,"best_value":0.372388}]},{"metric_name":"train accuracy","lower_is_better":false,"description":"Final training accuracy after the last epoch.","data":[{"dataset_name":"BPI2012","final_value":0.780099,"best_value":0.780099},{"dataset_name":"BPI2017","final_value":0.825575,"best_value":0.825575},{"dataset_name":"ROAD","final_value":0.879257,"best_value":0.879257}]},{"metric_name":"train F1 score (macro)","lower_is_better":false,"description":"Final macro-averaged F1 score on the training set.","data":[{"dataset_name":"BPI2012","final_value":0.601468,"best_value":0.601468},{"dataset_name":"BPI2017","final_value":0.647785,"best_value":0.647785},{"dataset_name":"ROAD","final_value":0.647995,"best_value":0.647995}]},{"metric_name":"train top-3 accuracy","lower_is_better":false,"description":"Final training top-3 accuracy.","data":[{"dataset_name":"BPI2012","final_value":0.97773,"best_value":0.97773},{"dataset_name":"BPI2017","final_value":0.984833,"best_value":0.984833},{"dataset_name":"ROAD","final_value":0.999171,"best_value":0.999171}]},{"metric_name":"train ECE","lower_is_better":true,"description":"Final Expected Calibration Error on the training set.","data":[{"dataset_name":"BPI2012","final_value":0.015108,"best_value":0.015108},{"dataset_name":"BPI2017","final_value":0.005811,"best_value":0.005811},{"dataset_name":"ROAD","final_value":0.011372,"best_value":0.011372}]},{"metric_name":"validation loss","lower_is_better":true,"description":"Final validation loss after the last epoch.","data":[{"dataset_name":"BPI2012","final_value":0.551736,"best_value":0.551736},{"dataset_name":"BPI2017","final_value":0.42144,"best_value":0.42144},{"dataset_name":"ROAD","final_value":0.399839,"best_value":0.399839}]},{"metric_name":"validation accuracy","lower_is_better":false,"description":"Final validation accuracy after the last epoch.","data":[{"dataset_name":"BPI2012","final_value":0.767329,"best_value":0.767329},{"dataset_name":"BPI2017","final_value":0.821006,"best_value":0.821006},{"dataset_name":"ROAD","final_value":0.874755,"best_value":0.874755}]},{"metric_name":"validation F1 score (macro)","lower_is_better":false,"description":"Final macro-averaged F1 score on the validation set.","data":[{"dataset_name":"BPI2012","final_value":0.581032,"best_value":0.581032},{"dataset_name":"BPI2017","final_value":0.631031,"best_value":0.631031},{"dataset_name":"ROAD","final_value":0.737367,"best_value":0.737367}]},{"metric_name":"validation top-3 accuracy","lower_is_better":false,"description":"Final and best top-3 accuracy on the validation set.","data":[{"dataset_name":"BPI2012","final_value":0.979186,"best_value":0.979186},{"dataset_name":"BPI2017","final_value":0.983305,"best_value":0.983305},{"dataset_name":"ROAD","final_value":0.999609,"best_value":0.999609}]},{"metric_name":"validation ECE","lower_is_better":true,"description":"Final Expected Calibration Error on the validation set.","data":[{"dataset_name":"BPI2012","final_value":0.024318,"best_value":0.024318},{"dataset_name":"BPI2017","final_value":0.007509,"best_value":0.007509},{"dataset_name":"ROAD","final_value":0.020124,"best_value":0.020124}]},{"metric_name":"test loss","lower_is_better":true,"description":"Final test loss after training.","data":[{"dataset_name":"BPI2012","final_value":0.559347,"best_value":0.559347},{"dataset_name":"BPI2017","final_value":0.424809,"best_value":0.424809},{"dataset_name":"ROAD","final_value":0.35495,"best_value":0.35495}]},{"metric_name":"test accuracy","lower_is_better":false,"description":"Final test accuracy after training.","data":[{"dataset_name":"BPI2012","final_value":0.764348,"best_value":0.764348},{"dataset_name":"BPI2017","final_value":0.828662,"best_value":0.828662},{"dataset_name":"ROAD","final_value":0.895533,"best_value":0.895533}]},{"metric_name":"test F1 score (macro)","lower_is_better":false,"description":"Final macro-averaged F1 score on the test set.","data":[{"dataset_name":"BPI2012","final_value":0.573526,"best_value":0.573526},{"dataset_name":"BPI2017","final_value":0.630893,"best_value":0.630893},{"dataset_name":"ROAD","final_value":0.719046,"best_value":0.719046}]},{"metric_name":"test top-3 accuracy","lower_is_better":false,"description":"Final top-3 accuracy on the test set.","data":[{"dataset_name":"BPI2012","final_value":0.981546,"best_value":0.981546},{"dataset_name":"BPI2017","final_value":0.984558,"best_value":0.984558},{"dataset_name":"ROAD","final_value":0.999262,"best_value":0.999262}]},{"metric_name":"test ECE","lower_is_better":true,"description":"Final Expected Calibration Error on the test set.","data":[{"dataset_name":"BPI2012","final_value":0.019878,"best_value":0.019878},{"dataset_name":"BPI2017","final_value":0.011444,"best_value":0.011444},{"dataset_name":"ROAD","final_value":0.020564,"best_value":0.020564}]},{"metric_name":"epochs trained","lower_is_better":false,"description":"Total number of epochs the model was trained for on this dataset.","data":[{"dataset_name":"BPI2012","final_value":26.0,"best_value":26.0},{"dataset_name":"BPI2017","final_value":40.0,"best_value":40.0},{"dataset_name":"ROAD","final_value":21.0,"best_value":21.0}]},{"metric_name":"best epoch","lower_is_better":false,"description":"Epoch index with the best validation top-3 accuracy.","data":[{"dataset_name":"BPI2012","final_value":18.0,"best_value":18.0},{"dataset_name":"BPI2017","final_value":40.0,"best_value":40.0},{"dataset_name":"ROAD","final_value":13.0,"best_value":13.0}]}]},"maximize":null,"name":null,"description":null},"is_buggy":false,"is_buggy_plots":false,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":["../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_confusion_matrix.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_train_val_loss.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_train_val_loss.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_curves.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_confusion_matrix.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_confusion_matrix.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_top3.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_val_top3.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_curves.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_top3.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_train_val_loss.png","../../logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_val_curves.png"],"plot_paths":["experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_confusion_matrix.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_train_val_loss.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_train_val_loss.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_curves.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_confusion_matrix.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_confusion_matrix.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_top3.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_val_top3.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_curves.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_top3.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_train_val_loss.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_val_curves.png"],"plot_analyses":[{"analysis":"The confusion matrix for BPI2012 reveals that the model has a strong ability to accurately predict next activities, as indicated by the pronounced diagonal. However, there are some off-diagonal elements suggesting the model occasionally predicts incorrect activities. This can be seen in the lower intensity of some diagonal elements compared to others, indicating variability in prediction accuracy across different activities.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_confusion_matrix.png"},{"analysis":"The training and validation loss curves for BPI2017 show a typical pattern where both losses decrease rapidly during the initial epochs and then stabilize, reflecting convergence. The validation loss closely follows the training loss, suggesting that the model is well-tuned with minimal overfitting. The gap between training and validation loss is small, indicating a good generalization performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_train_val_loss.png"},{"analysis":"The training and validation loss curves for the ROAD dataset exhibit similar behavior to BPI2017, with both losses decreasing rapidly before leveling off. The small gap between the training and validation loss suggests the model is effectively generalizing to unseen data. However, the ROAD dataset achieves this stabilization in fewer epochs, indicating potentially faster convergence.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_train_val_loss.png"},{"analysis":"The validation curves for BPI2017 demonstrate strong performance across different metrics. The accuracy, Macro-F1, and Top-3 accuracy are consistently high, indicating effective prediction capabilities. The Expected Calibration Error (ECE) remains low, suggesting the model's probabilistic predictions are well-calibrated. These metrics reflect a model that not only predicts accurately but also maintains consistent confidence levels.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_curves.png"},{"analysis":"The BPI2017 confusion matrix shows a strong diagonal, indicating the model's proficiency in predicting next activities accurately. Some off-diagonal values are present, which suggest occasional mispredictions. The concentration of correct predictions across most activities speaks to the model's robust performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_confusion_matrix.png"},{"analysis":"The confusion matrix for the ROAD dataset indicates that while the model performs well in predicting some activities, there are notable errors, especially in certain activities where off-diagonal values are prominent. This suggests variability in prediction accuracy and may indicate the need for further tuning or data preprocessing for specific activities.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_confusion_matrix.png"},{"analysis":"The validation curves for BPI2012 show consistently high performance in accuracy, Macro-F1, and Top-3 accuracy over epochs. The ECE is low, indicating well-calibrated predictions. The model maintains stable performance across epochs, reflecting a robust predictive capability.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_top3.png"},{"analysis":"The training and validation loss curves for BPI2012 display a typical convergence pattern with both losses decreasing rapidly and stabilizing over epochs. The proximity of the validation loss to the training loss suggests minimal overfitting and effective generalization.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/ROAD_val_top3.png"},{"analysis":"The validation curves for the ROAD dataset indicate strong performance in accuracy, Macro-F1, and Top-3 accuracy, with values consistently increasing across epochs. The ECE remains low, suggesting good calibration of predictions. These curves reflect a model that efficiently handles the prediction task with reliable performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2012_val_curves.png"},{"analysis":"The BPI2017 Top-3 validation accuracy curve shows stable and high performance across epochs. The model maintains a top-3 accuracy close to 98%, demonstrating its reliability in predicting the correct activity within the top three options. This consistency over epochs reflects the model's effective learning and predictive ability.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_251df5cdee2b452db709366215875b0a_proc_361839/BPI2017_val_top3.png"}],"vlm_feedback_summary":"The plots received from the experiments provide a comprehensive view of the model's performance across different datasets and metrics. The results highlight the model's strong predictive capabilities, especially in next-activity classification tasks, with consistent high accuracy, Macro-F1, and Top-3 accuracy across different logs. Calibration of predictions is generally well-maintained, as indicated by low ECE values. The loss curves suggest effective convergence and generalization, with minimal overfitting observed. Overall, the experiments show promising results in resource-centric predictive process monitoring, validating the hypothesis and supporting the research goals.","datasets_successfully_tested":["BPI2012","BPI2017","ROAD"],"ablation_name":null,"hyperparam_name":null,"is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nfrom datetime import datetime\nfrom typing import Dict, List, Tuple\n\n# Try importing pm4py, otherwise create a minimal fallback\ntry:\n    from pm4py.objects.log.importer.xes import importer as xes_importer\n\n    PM4PY_AVAILABLE = True\nexcept Exception:\n    PM4PY_AVAILABLE = False\n\n# Working directory\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\n# Device\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data container following required convention\nexperiment_data = {\n    \"dropout_tuning\": {\n        # dataset_name: filled at runtime\n    }\n}\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Utilities: Load datasets using pm4py from local XES (fallback to synthetic if not found)\ndef xes_to_df(log):\n    # Flatten PM4Py event log to pandas DataFrame with required columns\n    rows = []\n    for trace in log:\n        case_id = str(trace.attributes.get(\"concept:name\", \"unknown_case\"))\n        for ev in trace:\n            act = str(ev.get(\"concept:name\", \"UNKNOWN\"))\n            ts = ev.get(\"time:timestamp\", None)\n            lc = str(ev.get(\"lifecycle:transition\", \"complete\"))\n            if ts is None:\n                continue\n            rows.append(\n                {\n                    \"case_id\": case_id,\n                    \"activity\": act,\n                    \"timestamp\": pd.to_datetime(ts),\n                    \"lifecycle\": lc,\n                }\n            )\n    if len(rows) == 0:\n        return pd.DataFrame(columns=[\"case_id\", \"activity\", \"timestamp\", \"lifecycle\"])\n    df = pd.DataFrame(rows)\n    # Ensure required dtypes\n    df[\"case_id\"] = df[\"case_id\"].astype(str)\n    df[\"activity\"] = df[\"activity\"].astype(str)\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True)\n    if \"lifecycle\" in df.columns:\n        df[\"lifecycle\"] = df[\"lifecycle\"].astype(str)\n    return df\n\n\ndef generate_synthetic_df(n_cases=200, max_len=12, n_acts=10):\n    rows = []\n    base_time = pd.Timestamp(\"2020-01-01\", tz=\"UTC\")\n    for c in range(n_cases):\n        cid = f\"C{c:05d}\"\n        length = random.randint(3, max_len)\n        t = base_time + pd.Timedelta(days=random.randint(0, 365))\n        for i in range(length):\n            act = f\"A{random.randint(1, n_acts)}\"\n            t = t + pd.Timedelta(hours=random.randint(1, 48))\n            rows.append(\n                {\n                    \"case_id\": cid,\n                    \"activity\": act,\n                    \"timestamp\": t,\n                    \"lifecycle\": \"complete\",\n                }\n            )\n    df = pd.DataFrame(rows)\n    return df\n\n\ndef load_local_datasets():\n    datasets = {}\n    data_dir = os.path.join(os.getcwd(), \"data\")\n    os.makedirs(data_dir, exist_ok=True)\n    candidates = {\n        \"BPI2012\": [\"BPI_Challenge_2012.xes\", \"BPI2012.xes\"],\n        \"BPI2017\": [\"BPI_Challenge_2017.xes\", \"BPI2017.xes\"],\n        \"ROAD\": [\n            \"road_traffic_fines.xes\",\n            \"Road_Traffic_Fine_Management_Process.xes\",\n            \"ROAD.xes\",\n        ],\n    }\n    for name, files in candidates.items():\n        df = None\n        if PM4PY_AVAILABLE:\n            for fn in files:\n                path = os.path.join(data_dir, fn)\n                if os.path.exists(path):\n                    try:\n                        log = xes_importer.apply(path)\n                        df = xes_to_df(log)\n                        break\n                    except Exception as e:\n                        print(f\"[warn] Failed to load {path}: {e}\")\n        if df is None:\n            # Fallback synthetic data to keep script executable\n            print(f\"[info] Using synthetic data for {name} (no XES found).\")\n            df = generate_synthetic_df(n_cases=300, max_len=15, n_acts=20)\n        datasets[name] = df\n    return datasets\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self,\n        vocab_size,\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=0,\n        dropout=0.2,\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(dropout)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_model(\n    ds_train,\n    ds_val,\n    vocab_size,\n    pad_id,\n    epochs=20,\n    batch_size=128,\n    lr=1e-3,\n    max_prefix_len=10,\n    dropout=0.2,\n):\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    model = LSTMBaseline(\n        vocab_size=vocab_size,\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n        dropout=dropout,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    best_state = None\n    best_val_top3 = -1.0\n    hist = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_top3\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n    }\n\n    for epoch in range(1, epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, vocab_size, pad_id\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        hist[\"val_acc\"].append(val_acc)\n        hist[\"val_f1\"].append(val_f1)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n\n    # Load best weights\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    return model, hist, best_val_top3\n\n\ndef train_one_dataset(\n    name, df, base_epochs_check=20, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Re-normalize using train\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return None\n\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n\n    # Step 1: Baseline training with dropout=0.2 for >10 epochs to check plateau\n    base_dropout = 0.2\n    model_base, hist_base, best_val_top3_base = train_model(\n        ds_train,\n        ds_val,\n        vocab_size=len(act2id),\n        pad_id=pad_id,\n        epochs=base_epochs_check,\n        batch_size=batch_size,\n        lr=lr,\n        max_prefix_len=max_prefix_len,\n        dropout=base_dropout,\n    )\n    # Analyze improvement beyond epoch 10\n    first_half_best = (\n        max(hist_base[\"val_top3\"][:10])\n        if len(hist_base[\"val_top3\"]) >= 10\n        else max(hist_base[\"val_top3\"], default=0.0)\n    )\n    second_half_best = (\n        max(hist_base[\"val_top3\"][10:])\n        if len(hist_base[\"val_top3\"]) > 10\n        else first_half_best\n    )\n    improvement = second_half_best - first_half_best\n    print(\n        f\"[{name}] Validation top-3 first10={first_half_best:.4f}, next={second_half_best:.4f}, delta={improvement:.4f}\"\n    )\n\n    # Decide whether to tune dropout\n    tune_dropout = improvement <= 1e-3  # plateau or degrade\n    chosen_dropout = base_dropout\n    tuning_results = []\n\n    if tune_dropout:\n        print(f\"[{name}] Plateau/degrade detected. Tuning dropout...\")\n        sweep = [0.0, 0.1, 0.2, 0.3, 0.5]\n        best_sweep_score = -1.0\n        best_sweep_dropout = base_dropout\n        for dr in sweep:\n            model_tmp, hist_tmp, best_val_top3_tmp = train_model(\n                ds_train,\n                ds_val,\n                vocab_size=len(act2id),\n                pad_id=pad_id,\n                epochs=15,\n                batch_size=batch_size,\n                lr=lr,\n                max_prefix_len=max_prefix_len,\n                dropout=dr,\n            )\n            tuning_results.append(\n                {\"dropout\": dr, \"hist\": hist_tmp, \"best_val_top3\": best_val_top3_tmp}\n            )\n            print(f\"[{name}] Dropout={dr:.2f} best val top-3={best_val_top3_tmp:.4f}\")\n            if best_val_top3_tmp > best_sweep_score:\n                best_sweep_score = best_val_top3_tmp\n                best_sweep_dropout = dr\n        chosen_dropout = best_sweep_dropout\n        print(\n            f\"[{name}] Chosen dropout={chosen_dropout:.2f} with val top-3={best_sweep_score:.4f}\"\n        )\n        # Retrain final model with chosen dropout for base_epochs_check epochs\n        final_model, final_hist, _ = train_model(\n            ds_train,\n            ds_val,\n            vocab_size=len(act2id),\n            pad_id=pad_id,\n            epochs=base_epochs_check,\n            batch_size=batch_size,\n            lr=lr,\n            max_prefix_len=max_prefix_len,\n            dropout=chosen_dropout,\n        )\n        model_used = final_model\n        hist_used = final_hist\n    else:\n        print(\n            f\"[{name}] Continued improvement beyond epoch 10. Keeping baseline dropout={base_dropout}.\"\n        )\n        model_used = model_base\n        hist_used = hist_base\n\n    # Final evaluation on train/val/test\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    criterion = nn.CrossEntropyLoss().to(device)\n\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model_used, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model_used, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model_used, dl_test, criterion, device, len(act2id), pad_id\n    )\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Store results to experiment_data\n    experiment_data[\"dropout_tuning\"][name] = {\n        \"config\": {\n            \"max_prefix_len\": max_prefix_len,\n            \"batch_size\": batch_size,\n            \"lr\": lr,\n            \"base_epochs_check\": base_epochs_check,\n            \"pad_id\": pad_id,\n            \"vocab_size\": len(act2id),\n        },\n        \"diagnostics\": {\n            \"baseline_dropout\": base_dropout,\n            \"plateau_detected\": bool(tune_dropout),\n            \"first10_best_val_top3\": float(first_half_best),\n            \"next_best_val_top3\": float(second_half_best),\n            \"delta\": float(improvement),\n            \"chosen_dropout\": float(chosen_dropout),\n            \"tuning_results\": [\n                {\n                    \"dropout\": float(tr[\"dropout\"]),\n                    \"best_val_top3\": float(tr[\"best_val_top3\"]),\n                    \"hist_val_top3\": np.array(tr[\"hist\"][\"val_top3\"]).tolist(),\n                    \"hist_val_loss\": np.array(tr[\"hist\"][\"val_loss\"]).tolist(),\n                }\n                for tr in tuning_results\n            ],\n        },\n        \"metrics\": {\n            \"train\": [\n                {\n                    \"loss\": float(train_loss),\n                    \"acc\": float(train_acc),\n                    \"macro_f1\": float(train_f1),\n                    \"top3\": float(train_top3),\n                }\n            ],\n            \"val\": [\n                {\n                    \"loss\": float(val_loss),\n                    \"acc\": float(val_acc),\n                    \"macro_f1\": float(val_f1),\n                    \"top3\": float(val_top3),\n                }\n            ],\n            \"test\": [\n                {\n                    \"loss\": float(test_loss),\n                    \"acc\": float(test_acc),\n                    \"macro_f1\": float(test_f1),\n                    \"top3\": float(test_top3),\n                }\n            ],\n        },\n        \"losses\": {\n            \"train\": np.array(hist_used[\"train_loss\"]).tolist(),\n            \"val\": np.array(hist_used[\"val_loss\"]).tolist(),\n        },\n        \"val_top3_curve\": np.array(hist_used[\"val_top3\"]).tolist(),\n        \"val_acc_curve\": np.array(hist_used[\"val_acc\"]).tolist(),\n        \"val_f1_curve\": np.array(hist_used[\"val_f1\"]).tolist(),\n        \"predictions\": np.array(y_pred_t).tolist(),\n        \"ground_truth\": np.array(y_true_t).tolist(),\n        \"probs\": probs_t.tolist(),\n        \"id2act\": {\n            int(k): str(v)\n            for k, v in (\n                {k: v for k, v in enumerate(sorted(act2id.keys()), start=1)}\n            ).items()\n        },\n    }\n    return True\n\n\ndef main():\n    datasets = load_local_datasets()\n    for key, df in datasets.items():\n        # Optionally cap to 5000 earliest cases\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        train_one_dataset(\n            key,\n            df_small,\n            base_epochs_check=20,\n            batch_size=128,\n            max_prefix_len=10,\n            lr=1e-3,\n        )\n\n    # Save all experiment data as a single numpy file\n    np.save(\n        os.path.join(working_dir, \"experiment_data.npy\"),\n        experiment_data,\n        allow_pickle=True,\n    )\n\n\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: dropout_rate.\nI'll expose dropout as a hyperparameter in LSTMBaseline and pass it from train_one_dataset. First, I train a baseline model with dropout=0.2 for 20 epochs to check if validation top-3 improves beyond epoch 10; if it plateaus or degrades, I perform a small dropout sweep over {0.0, 0.1, 0.2, 0.3, 0.5} to pick the best validation top-3. I use pm4py to load local XES logs (falling back to a synthetic dataset if unavailable), perform time-based splits, and evaluate with accuracy, macro-F1, and top-3. All metrics, losses, predictions, and tuning diagnostics are stored in a single experiment_data dictionary and saved to experiment_data.npy.","overall_plan":"","plot_code":null,"plot_plan":null,"step":6,"id":"4b69709685c641ddb0c83c8ee9b5d661","ctime":1757758935.9756742,"_term_out":["Using device: cuda","\n","Execution time: a second seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1.3738315105438232,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The execution output is clearly incomplete: it only shows \"Using device: cuda\" and a generic execution time, without any of the numerous expected logs (dataset discovery, synthetic-data fallbacks, sample counts, training epochs, validation metrics, per-dataset test metrics). This strongly indicates that the main pipeline did not execute or terminated silently. Likely issues and fixes:\n\n1) Data path mismatch: The script only looks for XES files under ./data, whereas the workspace provides logs under ./input (per constraints and the provided robust loader). As a result it always falls back to synthetic data, but even then it should have printed synthetic-data messages. Fix: Replace load_local_datasets with the provided robust loader (ai_scientist/ideas/my_research_topic.py: load_datasets) that searches input/ and common fallbacks; or extend current loader to check ./input and .xes.gz and fuzzy patterns.\n\n2) Silent failure/early exit: Given the absence of any prints from training, an exception likely occurred before or during dataset iteration. Add try/except around main() and around per-dataset training to surface stack traces. Ensure stdout is flushed between stages and print dataset keys before training starts.\n\n3) Dependency handling: If pm4py is unavailable, the code sets PM4PY_AVAILABLE=False and should use synthetic data. However, if pm4py import partially succeeds but fails on loading a file, it might throw and break the loop. Ensure exceptions are caught and logged, and the fallback to synthetic is triggered per dataset.\n\n4) CUDA issues: Selecting cuda may cause device/memory errors that abort silently in some environments. Add a safe-device selection (try CUDA, otherwise fallback to CPU) and wrap training with explicit error handling; allow an env var to force CPU for debugging.\n\n5) Compliance gaps: The stage requires evaluation on BPI 2017 and Road logs with time-based splits and reporting metrics. Even if synthetic fallback is used, the output should report per-log metrics (acc, macro-F1, top-3). Ensure these prints occur and the experiment_data.npy is saved. Add final summary printout of per-dataset metrics.\n\n6) Minor robustness: Avoid using deprecated pandas int64 casting on timestamps; use .view(\"int64\") on datetime64[ns, UTC] or use .astype('int64') guarded with warnings filter.\n\nImplementing the robust data loader, adding explicit logging and exception handling around main/training, and allowing CPU fallback should make the run produce the expected per-dataset metrics and satisfy the constraints.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"dropout_rate","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score, confusion_matrix\nimport random\nfrom pathlib import Path\nimport math\nimport matplotlib.pyplot as plt\nfrom typing import Dict, List, Optional, Tuple\n\n# Device handling (CRITICAL GPU REQUIREMENTS)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment container\nexperiment_data = {\n    # Filled as:\n    # 'BPI2017': {'metrics': {'train': [], 'val': [], 'test': []}, 'losses': {'train': [], 'val': []}, ...}\n}\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# ---------- Robust XES discovery & loading ----------\ndef _has_xes(dirpath: Path) -> bool:\n    try:\n        return dirpath.is_dir() and (\n            any(dirpath.glob(\"*.xes\")) or any(dirpath.glob(\"*.xes.gz\"))\n        )\n    except Exception:\n        return False\n\n\ndef _resolve_data_dir() -> Path:\n    candidates: List[Path] = []\n    candidates += [Path(\"input\").resolve(), (Path.cwd() / \"input\").resolve()]\n    cwd = Path.cwd().resolve()\n    for base in [cwd, *cwd.parents]:\n        candidates.append((base / \"data\").resolve())\n        candidates.append((base / \"input\").resolve())\n    candidates += [\n        Path(\"/workspace/input\"),\n        Path(\"/workspace/data\"),\n        Path(\"/workspace/ai_scientist/data\"),\n        Path(\"/workspace/AI-Scientist-v2/data\"),\n        Path(\"/workspace/experiments/data\"),\n        Path(\"/workspace/ai_scientist/input\"),\n        Path(\"/workspace/experiments/input\"),\n    ]\n    seen = set()\n    for p in candidates:\n        if p in seen:\n            continue\n        seen.add(p)\n        if _has_xes(p):\n            print(f\"[data] Using discovered data dir: {p}\")\n            return p\n    tried = \"\\n  - \" + \"\\n  - \".join(str(c) for c in candidates)\n    raise FileNotFoundError(\n        \"Could not locate a directory containing .xes files.\\n\"\n        f\"Checked:{tried}\\n\"\n        \"Tips:\\n\"\n        \"  \u2022 Ensure filenames include BPI 2012/2017 or 'Road_Traffic_Fine_Management_Process' for auto-match.\"\n    )\n\n\ndef _first_match(d: Path, patterns: List[str]) -> Optional[Path]:\n    for pat in patterns:\n        for p in d.glob(pat):\n            if p.is_file():\n                return p\n    return None\n\n\ndef xes_to_df(xes_path: Path) -> pd.DataFrame:\n    try:\n        from pm4py.objects.log.importer.xes import importer as xes_importer\n    except Exception as e:\n        raise ImportError(\"pm4py is required. Install: pip install pm4py\") from e\n    print(f\"[data] Loading XES: {xes_path}\")\n    log = xes_importer.apply(str(xes_path))\n    rows = []\n    for tr in log:\n        case_id = tr.attributes.get(\"concept:name\") or tr.attributes.get(\n            \"case:concept:name\"\n        )\n        for e in tr:\n            rows.append(\n                {\n                    \"case_id\": str(case_id),\n                    \"activity\": str(e.get(\"concept:name\")),\n                    \"lifecycle\": str(e.get(\"lifecycle:transition\", \"complete\")),\n                    \"timestamp\": e.get(\"time:timestamp\"),\n                    \"resource\": str(e.get(\"org:resource\", \"System\")),\n                }\n            )\n    df = pd.DataFrame(rows)\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True, errors=\"coerce\")\n    df = df.dropna(subset=[\"timestamp\"]).reset_index(drop=True)\n    df = df[[\"case_id\", \"activity\", \"lifecycle\", \"timestamp\", \"resource\"]]\n    df = df.sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\ndef load_datasets() -> Dict[str, pd.DataFrame]:\n    patterns = {\n        \"BPI2012\": [\"BPI_Challenge_2012*.xes*\", \"BPI2012*.xes*\", \"*2012*.xes*\"],\n        \"BPI2017\": [\"BPI_Challenge_2017*.xes*\", \"BPI2017*.xes*\", \"*2017*.xes*\"],\n        \"ROAD\": [\n            \"Road_Traffic_Fine_Management_Process*.xes*\",\n            \"*Traffic*Fine*.xes*\",\n            \"*Traffic*.xes*\",\n        ],\n    }\n    datasets: Dict[str, pd.DataFrame] = {}\n    try:\n        data_dir = _resolve_data_dir()\n        available = sorted(\n            [\n                p.name\n                for p in list(data_dir.glob(\"*.xes\")) + list(data_dir.glob(\"*.xes.gz\"))\n            ]\n        )\n        print(f\"[data] Available in {data_dir}: {available}\")\n        for key, pats in patterns.items():\n            p = _first_match(data_dir, pats)\n            if p is not None:\n                try:\n                    datasets[key] = xes_to_df(p)\n                    print(f\"[data] Loaded {key}: {p.name}, events={len(datasets[key])}\")\n                except Exception as e:\n                    print(f\"[warn] Failed to load {key} from {p}: {e}\")\n            else:\n                print(f\"[data] Not found for {key} (patterns {patterns[key]})\")\n    except Exception as e:\n        print(f\"[warn] Dataset discovery failed: {e}\")\n    return datasets\n\n\n# Synthetic fallback\ndef make_synthetic_df(n_cases=500, max_events=15, seed=42) -> pd.DataFrame:\n    rng = np.random.default_rng(seed)\n    activities = [\"A\", \"B\", \"C\", \"D\", \"E\", \"F\", \"G\"]\n    rows = []\n    base_time = int(pd.Timestamp(\"2020-01-01\", tz=\"UTC\").value // 10**9)\n    for c in range(n_cases):\n        T = int(rng.integers(3, max_events))\n        start = base_time + int(rng.integers(0, 60 * 60 * 24 * 30))\n        ts = np.cumsum(rng.integers(10, 3600, size=T)) + start\n        for t in ts:\n            rows.append(\n                {\n                    \"case_id\": f\"S{c:05d}\",\n                    \"activity\": str(rng.choice(activities)),\n                    \"timestamp\": pd.to_datetime(t, unit=\"s\", utc=True),\n                    \"lifecycle\": \"complete\",\n                    \"resource\": \"System\",\n                }\n            )\n    df = pd.DataFrame(rows).sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\n# ---------- Prefix building and split ----------\ndef time_based_split(df: pd.DataFrame, train_frac=0.7, val_frac=0.15):\n    starts = df.groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\ndef build_prefix_dataset(df: pd.DataFrame, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy() // 10**9\n        )\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                }\n            )\n    # Standardize time deltas and since_start globally here (will re-fit on train later to avoid leakage)\n    if len(samples) > 0:\n        all_feats = np.concatenate(\n            [s[\"seq_feats\"] for s in samples if s[\"seq_feats\"].shape[0] > 0], axis=0\n        )\n        dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n        for s in samples:\n            if s[\"seq_feats\"].shape[0] > 0:\n                s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    return {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n\n\n# ---------- Model (unchanged architecture) ----------\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\n# ---------- Metrics ----------\ndef expected_calibration_error(\n    probs: np.ndarray, y_true: np.ndarray, n_bins: int = 15\n) -> float:\n    if probs.size == 0 or y_true.size == 0:\n        return 0.0\n    conf = probs.max(axis=1)\n    preds = probs.argmax(axis=1)\n    correct = (preds == y_true).astype(np.float32)\n    bins = np.linspace(0.0, 1.0, n_bins + 1)\n    ece = 0.0\n    for i in range(n_bins):\n        m = (conf > bins[i]) & (conf <= bins[i + 1])\n        if m.sum() == 0:\n            continue\n        acc_bin = correct[m].mean()\n        conf_bin = conf[m].mean()\n        ece += (m.mean()) * abs(acc_bin - conf_bin)\n    return float(ece)\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys, dtype=np.int64)\n    y_pred = np.array(preds_top1, dtype=np.int64)\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1), dtype=np.float32)\n    )\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    ece = (\n        expected_calibration_error(probs_concat, y_true, n_bins=15)\n        if probs_concat.shape[0] > 0\n        else 0.0\n    )\n    return avg_loss, acc, f1, top3, ece, y_true, y_pred, probs_concat\n\n\n# ---------- Training / tuning ----------\ndef train_eval_one_setting(\n    ds_name,\n    df,\n    batch_size=128,\n    max_epochs=12,\n    max_prefix_len=12,\n    lr=1e-3,\n    cap_cases=8000,\n):\n    # Cap cases for speed\n    try:\n        starts = (\n            df.groupby(\"case_id\")[\"timestamp\"]\n            .min()\n            .reset_index()\n            .sort_values(\"timestamp\")\n        )\n        if len(starts) > cap_cases:\n            keep_cases = set(starts.iloc[:cap_cases][\"case_id\"])\n            df = df[df[\"case_id\"].isin(keep_cases)].copy()\n    except Exception:\n        pass\n    # Split by time\n    train_cases, val_cases, test_cases = time_based_split(df, 0.70, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Refit normalization on train only (avoid leakage)\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm(samples_train)\n            norm(samples_val)\n            norm(samples_test)\n    print(\n        f\"[{ds_name}] samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}, vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(f\"[{ds_name}] Not enough data. Skipping.\")\n        return None\n\n    ds_tr = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_va = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_te = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn, num_workers=0\n    )\n    dl_va = DataLoader(\n        ds_va,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_te = DataLoader(\n        ds_te,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    history = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_top3\": [],\n        \"val_ece\": [],\n    }\n    best_state = None\n    best_val_top3 = -1.0\n\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            run_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        tr_loss = run_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, val_ece, _, _, _ = evaluate(\n            model, dl_va, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"[{ds_name}][bs={batch_size}, lr={lr}] Epoch {epoch}: validation_loss = {val_loss:.4f} acc={val_acc:.4f} f1={val_f1:.4f} top3={val_top3:.4f} ece={val_ece:.4f}\"\n        )\n        history[\"train_loss\"].append((epoch, float(tr_loss)))\n        history[\"val_loss\"].append((epoch, float(val_loss)))\n        history[\"val_acc\"].append((epoch, float(val_acc)))\n        history[\"val_f1\"].append((epoch, float(val_f1)))\n        history[\"val_top3\"].append((epoch, float(val_top3)))\n        history[\"val_ece\"].append((epoch, float(val_ece)))\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    (\n        train_loss,\n        train_acc,\n        train_f1,\n        train_top3,\n        train_ece,\n        y_true_tr,\n        y_pred_tr,\n        probs_tr,\n    ) = evaluate(model, dl_tr, criterion, device, len(act2id), pad_id)\n    val_loss, val_acc, val_f1, val_top3, val_ece, y_true_va, y_pred_va, probs_va = (\n        evaluate(model, dl_va, criterion, device, len(act2id), pad_id)\n    )\n    (\n        test_loss,\n        test_acc,\n        test_f1,\n        test_top3,\n        test_ece,\n        y_true_te,\n        y_pred_te,\n        probs_te,\n    ) = evaluate(model, dl_te, criterion, device, len(act2id), pad_id)\n\n    # Simple calibration plot for test\n    def plot_calibration(probs, y_true, title, out_path):\n        if probs.size == 0:\n            return\n        conf = probs.max(axis=1)\n        preds = probs.argmax(axis=1)\n        correct = (preds == y_true).astype(np.float32)\n        bins = np.linspace(0.0, 1.0, 11)\n        bin_ids = np.digitize(conf, bins) - 1\n        accs, confs, counts = [], [], []\n        for i in range(10):\n            m = bin_ids == i\n            if m.sum() == 0:\n                accs.append(0.0)\n                confs.append((bins[i] + bins[i + 1]) / 2)\n                counts.append(0)\n            else:\n                accs.append(correct[m].mean())\n                confs.append(conf[m].mean())\n                counts.append(m.sum())\n        plt.figure(figsize=(4, 4))\n        plt.plot([0, 1], [0, 1], \"k--\", label=\"Perfect\")\n        plt.plot(confs, accs, marker=\"o\", label=\"Model\")\n        plt.xlabel(\"Confidence\")\n        plt.ylabel(\"Accuracy\")\n        plt.title(title)\n        plt.legend()\n        plt.tight_layout()\n        plt.savefig(out_path)\n        plt.close()\n\n    plot_calibration(\n        probs_te,\n        y_true_te,\n        f\"{ds_name} Reliability (Test)\",\n        os.path.join(working_dir, f\"{ds_name}_reliability_test.png\"),\n    )\n\n    results = {\n        \"settings\": {\n            \"batch_size\": batch_size,\n            \"max_epochs\": max_epochs,\n            \"max_prefix_len\": max_prefix_len,\n            \"lr\": lr,\n            \"vocab_size\": len(act2id),\n        },\n        \"losses\": {\n            \"train\": history[\"train_loss\"],\n            \"val\": history[\"val_loss\"],\n        },\n        \"metrics\": {\n            \"train_final\": {\n                \"loss\": float(train_loss),\n                \"acc\": float(train_acc),\n                \"macro_f1\": float(train_f1),\n                \"top3\": float(train_top3),\n                \"ece\": float(train_ece),\n            },\n            \"val_final\": {\n                \"loss\": float(val_loss),\n                \"acc\": float(val_acc),\n                \"macro_f1\": float(val_f1),\n                \"top3\": float(val_top3),\n                \"ece\": float(val_ece),\n            },\n            \"test_final\": {\n                \"loss\": float(test_loss),\n                \"acc\": float(test_acc),\n                \"macro_f1\": float(test_f1),\n                \"top3\": float(test_top3),\n                \"ece\": float(test_ece),\n            },\n            \"val_curves\": {\n                \"acc\": history[\"val_acc\"],\n                \"macro_f1\": history[\"val_f1\"],\n                \"top3\": history[\"val_top3\"],\n                \"ece\": history[\"val_ece\"],\n            },\n        },\n        \"predictions\": {\n            \"train\": np.array(y_pred_tr, dtype=np.int64),\n            \"val\": np.array(y_pred_va, dtype=np.int64),\n            \"test\": np.array(y_pred_te, dtype=np.int64),\n        },\n        \"ground_truth\": {\n            \"train\": np.array(y_true_tr, dtype=np.int64),\n            \"val\": np.array(y_true_va, dtype=np.int64),\n            \"test\": np.array(y_true_te, dtype=np.int64),\n        },\n        \"probs\": {\n            \"train\": probs_tr,\n            \"val\": probs_va,\n            \"test\": probs_te,\n        },\n        \"act2id\": act2id,\n        \"pad_idx\": int(pad_id),\n    }\n    return results\n\n\ndef run_experiments():\n    # Load datasets with pm4py\n    datasets = load_datasets()\n    if len(datasets) == 0:\n        print(\"[info] No XES datasets found. Using synthetic dataset as fallback.\")\n        datasets = {\"SYNTH\": make_synthetic_df()}\n\n    # Hyperparameter grid (baseline tuning without changing architecture)\n    batch_grid = [64, 128, 256]\n    lr_grid = [5e-4, 1e-3]\n    max_epochs = 12\n    max_prefix_len = 12\n\n    for ds_name, df in datasets.items():\n        experiment_data.setdefault(\n            ds_name,\n            {\n                \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n                \"losses\": {\"train\": [], \"val\": []},\n                \"predictions\": [],\n                \"ground_truth\": [],\n                \"settings\": {},\n                \"best\": {},\n            },\n        )\n        best = {\"score\": -1.0, \"bs\": None, \"lr\": None, \"result\": None}\n        for bs in batch_grid:\n            for lr in lr_grid:\n                try:\n                    res = train_eval_one_setting(\n                        ds_name,\n                        df,\n                        batch_size=bs,\n                        max_epochs=max_epochs,\n                        max_prefix_len=max_prefix_len,\n                        lr=lr,\n                    )\n                except RuntimeError as e:\n                    print(\n                        f\"[warn][{ds_name}] Runtime error for batch_size={bs}, lr={lr}: {e}\"\n                    )\n                    res = None\n                key = f\"bs{bs}_lr{lr}\"\n                if res is None:\n                    continue\n                # Track per-epoch val loss for plotting\n                experiment_data[ds_name][\"losses\"][\"train\"].extend(\n                    res[\"losses\"][\"train\"]\n                )\n                experiment_data[ds_name][\"losses\"][\"val\"].extend(res[\"losses\"][\"val\"])\n                # Append metrics snapshots\n                experiment_data[ds_name][\"metrics\"][\"train\"].append(\n                    (\"final\", res[\"metrics\"][\"train_final\"])\n                )\n                experiment_data[ds_name][\"metrics\"][\"val\"].append(\n                    (\"final\", res[\"metrics\"][\"val_final\"])\n                )\n                experiment_data[ds_name][\"metrics\"][\"test\"].append(\n                    (\"final\", res[\"metrics\"][\"test_final\"])\n                )\n                experiment_data[ds_name][\"settings\"][key] = res[\"settings\"]\n                # Keep last predictions for the candidate\n                experiment_data[ds_name][\"predictions\"] = res[\"predictions\"][\"test\"]\n                experiment_data[ds_name][\"ground_truth\"] = res[\"ground_truth\"][\"test\"]\n                # Select best by validation top-3\n                val_top3 = res[\"metrics\"][\"val_final\"][\"top3\"]\n                if val_top3 > best[\"score\"]:\n                    best = {\"score\": val_top3, \"bs\": bs, \"lr\": lr, \"result\": res}\n        if best[\"result\"] is not None:\n            experiment_data[ds_name][\"best\"] = {\n                \"batch_size\": best[\"bs\"],\n                \"lr\": best[\"lr\"],\n                \"val_top3\": float(best[\"score\"]),\n                \"test_acc\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"acc\"]),\n                \"test_top3\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"top3\"]),\n                \"test_macro_f1\": float(\n                    best[\"result\"][\"metrics\"][\"test_final\"][\"macro_f1\"]\n                ),\n                \"test_ece\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"ece\"]),\n            }\n            print(\n                f\"[{ds_name}] Best setting: bs={best['bs']} lr={best['lr']} | val_top3={best['score']:.4f} | test_acc={best['result']['metrics']['test_final']['acc']:.4f} test_top3={best['result']['metrics']['test_final']['top3']:.4f} ece={best['result']['metrics']['test_final']['ece']:.4f}\"\n            )\n        else:\n            print(f\"[{ds_name}] No successful runs.\")\n\n    # Save data\n    np.save(\n        os.path.join(working_dir, \"experiment_data.npy\"),\n        experiment_data,\n        allow_pickle=True,\n    )\n\n\n# Execute immediately\nrun_experiments()\n","plan":"The previous script failed to robustly discover and load local XES logs under input/, did not compute the required Expected Calibration Error (ECE), and wrapped execution under if __name__ == \"__main__\": which prevented immediate execution in some environments. I fix this by adding a resilient data directory resolver (preferring ./input with .xes/.xes.gz), aligning dataset name matching for BPI 2017 and Road Traffic Fine logs, and ensuring time-based splits. I keep the same 1-layer LSTM architecture but tune batch size and learning rate, track per-epoch validation metrics including ECE, and report/save per-dataset train/val/test metrics. I also add simple calibration plots and ensure all tensors/models are moved to the designated device.","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import (\n    f1_score,\n    accuracy_score,\n    confusion_matrix,\n    precision_recall_curve,\n    average_precision_score,\n)\nimport random\nfrom pathlib import Path\nimport math\nfrom typing import Dict, List, Optional, Tuple\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\nexperiment_data = {}\n\n\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\ndef _has_xes(dirpath: Path) -> bool:\n    try:\n        return dirpath.is_dir() and (\n            any(dirpath.glob(\"*.xes\")) or any(dirpath.glob(\"*.xes.gz\"))\n        )\n    except Exception:\n        return False\n\n\ndef _resolve_data_dir() -> Path:\n    candidates: List[Path] = []\n    candidates += [Path(\"input\").resolve(), (Path.cwd() / \"input\").resolve()]\n    cwd = Path.cwd().resolve()\n    for base in [cwd, *cwd.parents]:\n        candidates.append((base / \"data\").resolve())\n        candidates.append((base / \"input\").resolve())\n    candidates += [\n        Path(\"/workspace/input\"),\n        Path(\"/workspace/data\"),\n        Path(\"/workspace/ai_scientist/data\"),\n        Path(\"/workspace/AI-Scientist-v2/data\"),\n        Path(\"/workspace/experiments/data\"),\n        Path(\"/workspace/ai_scientist/input\"),\n        Path(\"/workspace/experiments/input\"),\n    ]\n    seen = set()\n    for p in candidates:\n        if p in seen:\n            continue\n        seen.add(p)\n        if _has_xes(p):\n            print(f\"[data] Using discovered data dir: {p}\")\n            return p\n    tried = \"\\n  - \" + \"\\n  - \".join(str(c) for c in candidates)\n    raise FileNotFoundError(\n        \"Could not locate a directory containing .xes files.\\n\"\n        f\"Checked:{tried}\\n\"\n        \"Tips:\\n  \u2022 Ensure filenames include BPI 2012/2017 or 'Road_Traffic_Fine_Management_Process' for auto-match.\"\n    )\n\n\ndef _first_match(d: Path, patterns: List[str]) -> Optional[Path]:\n    for pat in patterns:\n        for p in d.glob(pat):\n            if p.is_file():\n                return p\n    return None\n\n\ndef xes_to_df(xes_path: Path) -> pd.DataFrame:\n    try:\n        from pm4py.objects.log.importer.xes import importer as xes_importer\n    except Exception as e:\n        raise ImportError(\"pm4py is required. Install: pip install pm4py\") from e\n    print(f\"[data] Loading XES: {xes_path}\")\n    log = xes_importer.apply(str(xes_path))\n    rows = []\n    for tr in log:\n        case_id = tr.attributes.get(\"concept:name\") or tr.attributes.get(\n            \"case:concept:name\"\n        )\n        for e in tr:\n            rows.append(\n                {\n                    \"case_id\": str(case_id),\n                    \"activity\": str(e.get(\"concept:name\")),\n                    \"lifecycle\": str(e.get(\"lifecycle:transition\", \"complete\")),\n                    \"timestamp\": e.get(\"time:timestamp\"),\n                    \"resource\": str(e.get(\"org:resource\", \"System\")),\n                }\n            )\n    df = pd.DataFrame(rows)\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True, errors=\"coerce\")\n    df = df.dropna(subset=[\"timestamp\"]).reset_index(drop=True)\n    df = df[[\"case_id\", \"activity\", \"lifecycle\", \"timestamp\", \"resource\"]]\n    df = df.sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\ndef load_datasets() -> Dict[str, pd.DataFrame]:\n    patterns = {\n        \"BPI2012\": [\"BPI_Challenge_2012*.xes*\", \"BPI2012*.xes*\", \"*2012*.xes*\"],\n        \"BPI2017\": [\"BPI_Challenge_2017*.xes*\", \"BPI2017*.xes*\", \"*2017*.xes*\"],\n        \"ROAD\": [\n            \"Road_Traffic_Fine_Management_Process*.xes*\",\n            \"*Traffic*Fine*.xes*\",\n            \"*Traffic*.xes*\",\n        ],\n    }\n    datasets: Dict[str, pd.DataFrame] = {}\n    try:\n        data_dir = _resolve_data_dir()\n        available = sorted(\n            [\n                p.name\n                for p in list(data_dir.glob(\"*.xes\")) + list(data_dir.glob(\"*.xes.gz\"))\n            ]\n        )\n        print(f\"[data] Available in {data_dir}: {available}\")\n        for key, pats in patterns.items():\n            p = _first_match(data_dir, pats)\n            if p is not None:\n                try:\n                    datasets[key] = xes_to_df(p)\n                    print(f\"[data] Loaded {key}: {p.name}, events={len(datasets[key])}\")\n                except Exception as e:\n                    print(f\"[warn] Failed to load {key} from {p}: {e}\")\n            else:\n                print(f\"[data] Not found for {key} (patterns {patterns[key]})\")\n    except Exception as e:\n        print(f\"[warn] Dataset discovery failed: {e}\")\n    return datasets\n\n\ndef make_synthetic_df(n_cases=500, max_events=15, seed=42) -> pd.DataFrame:\n    rng = np.random.default_rng(seed)\n    activities = [\"A\", \"B\", \"C\", \"D\", \"E\", \"F\", \"G\"]\n    rows = []\n    base_time = int(pd.Timestamp(\"2020-01-01\", tz=\"UTC\").value // 10**9)\n    for c in range(n_cases):\n        T = int(rng.integers(3, max_events))\n        start = base_time + int(rng.integers(0, 60 * 60 * 24 * 30))\n        ts = np.cumsum(rng.integers(10, 3600, size=T)) + start\n        for t in ts:\n            rows.append(\n                {\n                    \"case_id\": f\"S{c:05d}\",\n                    \"activity\": str(rng.choice(activities)),\n                    \"timestamp\": pd.to_datetime(t, unit=\"s\", utc=True),\n                    \"lifecycle\": \"complete\",\n                    \"resource\": \"System\",\n                }\n            )\n    df = pd.DataFrame(rows).sort_values([\"case_id\", \"timestamp\"]).reset_index(drop=True)\n    return df\n\n\ndef time_based_split(df: pd.DataFrame, train_frac=0.7, val_frac=0.15):\n    starts = df.groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\ndef build_prefix_dataset(df: pd.DataFrame, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy() // 10**9\n        )\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                }\n            )\n    if len(samples) > 0:\n        all_feats = np.concatenate(\n            [s[\"seq_feats\"] for s in samples if s[\"seq_feats\"].shape[0] > 0], axis=0\n        )\n        dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n        for s in samples:\n            if s[\"seq_feats\"].shape[0] > 0:\n                s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    return {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = self.dropout(h[-1])\n        logits = self.fc(h_last)\n        return logits\n\n\ndef expected_calibration_error(\n    probs: np.ndarray, y_true: np.ndarray, n_bins: int = 15\n) -> float:\n    if probs.size == 0 or y_true.size == 0:\n        return 0.0\n    conf = probs.max(axis=1)\n    preds = probs.argmax(axis=1)\n    correct = (preds == y_true).astype(np.float32)\n    bins = np.linspace(0.0, 1.0, n_bins + 1)\n    ece = 0.0\n    for i in range(n_bins):\n        m = (conf > bins[i]) & (conf <= bins[i + 1])\n        if m.sum() == 0:\n            continue\n        acc_bin = correct[m].mean()\n        conf_bin = conf[m].mean()\n        ece += (m.mean()) * abs(acc_bin - conf_bin)\n    return float(ece)\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys, dtype=np.int64)\n    y_pred = np.array(preds_top1, dtype=np.int64)\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1), dtype=np.float32)\n    )\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    ece = (\n        expected_calibration_error(probs_concat, y_true, n_bins=15)\n        if probs_concat.shape[0] > 0\n        else 0.0\n    )\n    return avg_loss, acc, f1, top3, ece, y_true, y_pred, probs_concat\n\n\ndef train_eval_one_setting(\n    ds_name,\n    df,\n    batch_size=128,\n    max_epochs=12,\n    max_prefix_len=12,\n    lr=1e-3,\n    cap_cases=8000,\n):\n    try:\n        starts = (\n            df.groupby(\"case_id\")[\"timestamp\"]\n            .min()\n            .reset_index()\n            .sort_values(\"timestamp\")\n        )\n        if len(starts) > cap_cases:\n            keep_cases = set(starts.iloc[:cap_cases][\"case_id\"])\n            df = df[df[\"case_id\"].isin(keep_cases)].copy()\n    except Exception:\n        pass\n    train_cases, val_cases, test_cases = time_based_split(df, 0.70, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm(samples_train)\n            norm(samples_val)\n            norm(samples_test)\n    print(\n        f\"[{ds_name}] samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}, vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(f\"[{ds_name}] Not enough data. Skipping.\")\n        return None\n    ds_tr = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_va = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_te = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn, num_workers=0\n    )\n    dl_va = DataLoader(\n        ds_va,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_te = DataLoader(\n        ds_te,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n    history = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_top3\": [],\n        \"val_ece\": [],\n    }\n    best_state = None\n    best_val_top3 = -1.0\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            run_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        tr_loss = run_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, val_ece, _, _, _ = evaluate(\n            model, dl_va, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"[{ds_name}][bs={batch_size}, lr={lr}] Epoch {epoch}: validation_loss = {val_loss:.4f} acc={val_acc:.4f} f1={val_f1:.4f} top3={val_top3:.4f} ece={val_ece:.4f}\"\n        )\n        history[\"train_loss\"].append((epoch, float(tr_loss)))\n        history[\"val_loss\"].append((epoch, float(val_loss)))\n        history[\"val_acc\"].append((epoch, float(val_acc)))\n        history[\"val_f1\"].append((epoch, float(val_f1)))\n        history[\"val_top3\"].append((epoch, float(val_top3)))\n        history[\"val_ece\"].append((epoch, float(val_ece)))\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    (\n        train_loss,\n        train_acc,\n        train_f1,\n        train_top3,\n        train_ece,\n        y_true_tr,\n        y_pred_tr,\n        probs_tr,\n    ) = evaluate(model, dl_tr, criterion, device, len(act2id), pad_id)\n    val_loss, val_acc, val_f1, val_top3, val_ece, y_true_va, y_pred_va, probs_va = (\n        evaluate(model, dl_va, criterion, device, len(act2id), pad_id)\n    )\n    (\n        test_loss,\n        test_acc,\n        test_f1,\n        test_top3,\n        test_ece,\n        y_true_te,\n        y_pred_te,\n        probs_te,\n    ) = evaluate(model, dl_te, criterion, device, len(act2id), pad_id)\n\n    def plot_calibration(probs, y_true, title, out_path):\n        if probs.size == 0:\n            return\n        conf = probs.max(axis=1)\n        preds = probs.argmax(axis=1)\n        correct = (preds == y_true).astype(np.float32)\n        bins = np.linspace(0.0, 1.0, 11)\n        bin_ids = np.digitize(conf, bins) - 1\n        accs, confs = [], []\n        for i in range(10):\n            m = bin_ids == i\n            if m.sum() == 0:\n                accs.append(0.0)\n                confs.append((bins[i] + bins[i + 1]) / 2)\n            else:\n                accs.append(correct[m].mean())\n                confs.append(conf[m].mean())\n        plt.figure(figsize=(4, 4))\n        plt.plot([0, 1], [0, 1], \"k--\", label=\"Perfect\")\n        plt.plot(confs, accs, marker=\"o\", label=\"Model\")\n        plt.xlabel(\"Confidence\")\n        plt.ylabel(\"Accuracy\")\n        plt.title(title)\n        plt.legend()\n        plt.tight_layout()\n        plt.savefig(out_path)\n        plt.close()\n\n    plot_calibration(\n        probs_te,\n        y_true_te,\n        f\"{ds_name} Reliability (Test)\",\n        os.path.join(working_dir, f\"{ds_name}_reliability_test.png\"),\n    )\n    results = {\n        \"settings\": {\n            \"batch_size\": batch_size,\n            \"max_epochs\": max_epochs,\n            \"max_prefix_len\": max_prefix_len,\n            \"lr\": lr,\n            \"vocab_size\": len(act2id),\n        },\n        \"losses\": {\"train\": history[\"train_loss\"], \"val\": history[\"val_loss\"]},\n        \"metrics\": {\n            \"train_final\": {\n                \"loss\": float(train_loss),\n                \"acc\": float(train_acc),\n                \"macro_f1\": float(train_f1),\n                \"top3\": float(train_top3),\n                \"ece\": float(train_ece),\n            },\n            \"val_final\": {\n                \"loss\": float(val_loss),\n                \"acc\": float(val_acc),\n                \"macro_f1\": float(val_f1),\n                \"top3\": float(val_top3),\n                \"ece\": float(val_ece),\n            },\n            \"test_final\": {\n                \"loss\": float(test_loss),\n                \"acc\": float(test_acc),\n                \"macro_f1\": float(test_f1),\n                \"top3\": float(test_top3),\n                \"ece\": float(test_ece),\n            },\n            \"val_curves\": {\n                \"acc\": history[\"val_acc\"],\n                \"macro_f1\": history[\"val_f1\"],\n                \"top3\": history[\"val_top3\"],\n                \"ece\": history[\"val_ece\"],\n            },\n        },\n        \"predictions\": {\n            \"train\": np.array(y_pred_tr, dtype=np.int64),\n            \"val\": np.array(y_pred_va, dtype=np.int64),\n            \"test\": np.array(y_pred_te, dtype=np.int64),\n        },\n        \"ground_truth\": {\n            \"train\": np.array(y_true_tr, dtype=np.int64),\n            \"val\": np.array(y_true_va, dtype=np.int64),\n            \"test\": np.array(y_true_te, dtype=np.int64),\n        },\n        \"probs\": {\"train\": probs_tr, \"val\": probs_va, \"test\": probs_te},\n        \"act2id\": act2id,\n        \"pad_idx\": int(pad_id),\n    }\n    return results\n\n\ndef run_experiments():\n    datasets = load_datasets()\n    if len(datasets) == 0:\n        print(\"[info] No XES datasets found. Using synthetic dataset as fallback.\")\n        datasets = {\"SYNTH\": make_synthetic_df()}\n    batch_grid = [64, 128, 256]\n    lr_grid = [5e-4, 1e-3]\n    max_epochs = 12\n    max_prefix_len = 12\n    for ds_name, df in datasets.items():\n        experiment_data.setdefault(\n            ds_name,\n            {\n                \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n                \"losses\": {\"train\": [], \"val\": []},\n                \"predictions\": [],\n                \"ground_truth\": [],\n                \"settings\": {},\n                \"best\": {},\n            },\n        )\n        best = {\"score\": -1.0, \"bs\": None, \"lr\": None, \"result\": None}\n        for bs in batch_grid:\n            for lr in lr_grid:\n                try:\n                    res = train_eval_one_setting(\n                        ds_name,\n                        df,\n                        batch_size=bs,\n                        max_epochs=max_epochs,\n                        max_prefix_len=max_prefix_len,\n                        lr=lr,\n                    )\n                except RuntimeError as e:\n                    print(\n                        f\"[warn][{ds_name}] Runtime error for batch_size={bs}, lr={lr}: {e}\"\n                    )\n                    res = None\n                key = f\"bs{bs}_lr{lr}\"\n                if res is None:\n                    continue\n                experiment_data[ds_name][\"losses\"][\"train\"].extend(\n                    res[\"losses\"][\"train\"]\n                )\n                experiment_data[ds_name][\"losses\"][\"val\"].extend(res[\"losses\"][\"val\"])\n                experiment_data[ds_name][\"metrics\"][\"train\"].append(\n                    (\"final\", res[\"metrics\"][\"train_final\"])\n                )\n                experiment_data[ds_name][\"metrics\"][\"val\"].append(\n                    (\"final\", res[\"metrics\"][\"val_final\"])\n                )\n                experiment_data[ds_name][\"metrics\"][\"test\"].append(\n                    (\"final\", res[\"metrics\"][\"test_final\"])\n                )\n                experiment_data[ds_name][\"settings\"][key] = res[\"settings\"]\n                experiment_data[ds_name][\"predictions\"] = res[\"predictions\"][\"test\"]\n                experiment_data[ds_name][\"ground_truth\"] = res[\"ground_truth\"][\"test\"]\n                val_top3 = res[\"metrics\"][\"val_final\"][\"top3\"]\n                if val_top3 > best[\"score\"]:\n                    best = {\"score\": val_top3, \"bs\": bs, \"lr\": lr, \"result\": res}\n        if best[\"result\"] is not None:\n            experiment_data[ds_name][\"best\"] = {\n                \"batch_size\": best[\"bs\"],\n                \"lr\": best[\"lr\"],\n                \"val_top3\": float(best[\"score\"]),\n                \"test_acc\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"acc\"]),\n                \"test_top3\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"top3\"]),\n                \"test_macro_f1\": float(\n                    best[\"result\"][\"metrics\"][\"test_final\"][\"macro_f1\"]\n                ),\n                \"test_ece\": float(best[\"result\"][\"metrics\"][\"test_final\"][\"ece\"]),\n            }\n            print(\n                f\"[{ds_name}] Best setting: bs={best['bs']} lr={best['lr']} | val_top3={best['score']:.4f} | test_acc={best['result']['metrics']['test_final']['acc']:.4f} test_top3={best['result']['metrics']['test_final']['top3']:.4f} ece={best['result']['metrics']['test_final']['ece']:.4f}\"\n            )\n        else:\n            print(f\"[{ds_name}] No successful runs.\")\n    np.save(\n        os.path.join(working_dir, \"experiment_data.npy\"),\n        experiment_data,\n        allow_pickle=True,\n    )\n\n\n# Train and save\nrun_experiments()\n\n# Load and Plot\ntry:\n    experiment_data = np.load(\n        os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n    ).item()\nexcept Exception as e:\n    print(f\"Error loading experiment data: {e}\")\n\nfor ds_name, ds_blob in experiment_data.items():\n    # 1) Training/Validation Loss Curves\n    try:\n        plt.figure()\n        tr = ds_blob.get(\"losses\", {}).get(\"train\", [])\n        va = ds_blob.get(\"losses\", {}).get(\"val\", [])\n        if len(tr) > 0 or len(va) > 0:\n            if len(tr) > 0:\n                epochs_tr = [e for e, v in tr]\n                vals_tr = [v for e, v in tr]\n                plt.plot(epochs_tr, vals_tr, label=\"Train Loss\")\n            if len(va) > 0:\n                epochs_va = [e for e, v in va]\n                vals_va = [v for e, v in va]\n                plt.plot(epochs_va, vals_va, label=\"Val Loss\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.title(f\"{ds_name} Loss Curves (Next-Activity)\")\n            plt.legend()\n            plt.tight_layout()\n            plt.savefig(\n                os.path.join(working_dir, f\"{ds_name}_loss_curves_next_activity.png\")\n            )\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating loss curves for {ds_name}: {e}\")\n        plt.close()\n\n    # 2) Confusion Matrix (Test)\n    try:\n        y_true = np.array(ds_blob.get(\"ground_truth\", []))\n        y_pred = np.array(ds_blob.get(\"predictions\", []))\n        if isinstance(y_true, dict):\n            y_true = y_true.get(\"test\", np.array([]))\n        if isinstance(y_pred, dict):\n            y_pred = y_pred.get(\"test\", np.array([]))\n        if y_true.size > 0 and y_pred.size > 0:\n            cm = confusion_matrix(y_true, y_pred)\n            plt.figure(figsize=(6, 5))\n            plt.imshow(cm, cmap=\"Blues\")\n            plt.colorbar()\n            plt.xlabel(\"Predicted\")\n            plt.ylabel(\"True\")\n            plt.title(f\"{ds_name} Confusion Matrix (Next-Activity, Test)\")\n            plt.tight_layout()\n            plt.savefig(\n                os.path.join(\n                    working_dir, f\"{ds_name}_confusion_matrix_next_activity_test.png\"\n                )\n            )\n            plt.close()\n        else:\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {ds_name}: {e}\")\n        plt.close()\n\n    # 3) Macro Precision-Recall Curve (Test)\n    try:\n        probs = ds_blob.get(\"probs\", {}).get(\"test\", None)\n        y_true = ds_blob.get(\"ground_truth\", {}).get(\"test\", None)\n        if (\n            probs is not None\n            and y_true is not None\n            and len(probs) == len(y_true)\n            and len(y_true) > 0\n        ):\n            n_classes = probs.shape[1]\n            # Ignore padding class 0 if present by masking columns that are never true\n            classes = np.unique(y_true)\n            y_true_mat = np.zeros((len(y_true), n_classes), dtype=int)\n            for i, c in enumerate(y_true):\n                if c >= 0 and c < n_classes:\n                    y_true_mat[i, c] = 1\n            pr_areas = []\n            precisions_macro = []\n            recalls_macro = []\n            # Compute macro by averaging interpolated precision across classes present in truth\n            valid_classes = [c for c in range(n_classes) if y_true_mat[:, c].sum() > 0]\n            grid = np.linspace(0, 1, 101)\n            prec_accum = np.zeros_like(grid)\n            for c in valid_classes:\n                prec, rec, _ = precision_recall_curve(y_true_mat[:, c], probs[:, c])\n                # interpolate precision as function of recall\n                prec_interp = np.interp(\n                    grid, rec[::-1], prec[::-1], left=prec[0], right=prec[-1]\n                )\n                prec_accum += prec_interp\n                try:\n                    ap = average_precision_score(y_true_mat[:, c], probs[:, c])\n                    pr_areas.append(ap)\n                except Exception:\n                    pass\n            if len(valid_classes) > 0:\n                prec_macro = prec_accum / len(valid_classes)\n                plt.figure()\n                plt.plot(\n                    grid, prec_macro, label=f\"Macro-PR (AP~{np.mean(pr_areas):.3f})\"\n                )\n                plt.xlabel(\"Recall\")\n                plt.ylabel(\"Precision\")\n                plt.title(f\"{ds_name} Macro PR Curve (Next-Activity, Test)\")\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(\n                        working_dir, f\"{ds_name}_macro_pr_next_activity_test.png\"\n                    )\n                )\n                plt.close()\n            else:\n                plt.close()\n        else:\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating macro PR curve for {ds_name}: {e}\")\n        plt.close()\n\n# Print summary BPM metrics\nfor ds_name, ds_blob in experiment_data.items():\n    best = ds_blob.get(\"best\", {})\n    if best:\n        print(\n            f\"[RESULT] {ds_name} | Best bs={best.get('batch_size')} lr={best.get('lr')} | \"\n            f\"Test Acc={best.get('test_acc'):.4f} | Test Top-3={best.get('test_top3'):.4f} | \"\n            f\"Test Macro-F1={best.get('test_macro_f1'):.4f} | Test ECE={best.get('test_ece'):.4f}\"\n        )\n    else:\n        # try to print any available final test from first metric entry\n        tests = ds_blob.get(\"metrics\", {}).get(\"test\", [])\n        if len(tests) > 0 and isinstance(tests[0], tuple):\n            m = tests[0][1]\n            print(\n                f\"[RESULT] {ds_name} | Test Acc={m.get('acc', float('nan')):.4f} | Top-3={m.get('top3', float('nan')):.4f} | Macro-F1={m.get('macro_f1', float('nan')):.4f} | ECE={m.get('ece', float('nan')):.4f}\"\n            )\n","plot_plan":"We will build a next-activity prediction pipeline that loads local XES logs via pm4py, converts them to a sorted event DataFrame, and constructs time-based train/val/test splits by case start time. For each case we generate prefixes with contextual features and train a simple LSTM baseline over activity embeddings plus continuous features. We will tune basic hyperparameters (batch size and learning rate) with early model selection based on validation Top-3 accuracy and evaluate on the test split. We report BPM metrics for next-activity: accuracy, macro-F1, Top-3 accuracy, and calibration error (ECE), and we save a reliability plot. After training, we persist all results into experiment_data.npy. We then load experiment_data.npy to generate standard visualizations: training/validation loss curves, test confusion matrix, and macro precision-recall curves when probabilistic outputs exist. Each plot is saved to working_dir with dataset-specific filenames, wrapped in try-except blocks, and figures are always closed. Finally, we print best settings and test metrics per dataset to the console.","step":7,"id":"b6970d0586c74652a8d858ed9350bd81","ctime":1757759650.0756283,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Available in /workspace/data: ['BPI_Challenge_2012.xes', 'BPI_Challenge_2017.xes', 'Road_Traffic_Fine_Management_Process.xes']","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<22:14,  9.80it/s]","\rparsing log, completed traces ::   1%|1         | 160/13087 [00:00<00:13, 930.62it/s]","\rparsing log, completed traces ::   2%|2         | 318/13087 [00:00<00:10, 1223.23it/s]","\rparsing log, completed traces ::   3%|3         | 441/13087 [00:00<00:22, 557.56it/s] ","\rparsing log, completed traces ::   5%|4         | 605/13087 [00:00<00:16, 777.15it/s]","\rparsing log, completed traces ::   6%|6         | 793/13087 [00:00<00:11, 1025.33it/s]","\rparsing log, completed traces ::   7%|7         | 957/13087 [00:01<00:10, 1174.06it/s]","\rparsing log, completed traces ::   9%|8         | 1120/13087 [00:01<00:09, 1290.81it/s]","\rparsing log, completed traces ::  10%|9         | 1300/13087 [00:01<00:08, 1424.41it/s]","\rparsing log, completed traces ::  12%|#1        | 1510/13087 [00:01<00:07, 1608.89it/s]","\rparsing log, completed traces ::  13%|#2        | 1688/13087 [00:01<00:06, 1652.59it/s]","\rparsing log, completed traces ::  14%|#4        | 1864/13087 [00:01<00:06, 1678.86it/s]","\rparsing log, completed traces ::  16%|#5        | 2040/13087 [00:01<00:06, 1663.47it/s]","\rparsing log, completed traces ::  17%|#6        | 2215/13087 [00:01<00:06, 1684.41it/s]","\rparsing log, completed traces ::  18%|#8        | 2395/13087 [00:01<00:06, 1714.80it/s]","\rparsing log, completed traces ::  20%|#9        | 2575/13087 [00:01<00:06, 1736.49it/s]","\rparsing log, completed traces ::  21%|##1       | 2751/13087 [00:02<00:06, 1690.63it/s]","\rparsing log, completed traces ::  22%|##2       | 2922/13087 [00:02<00:06, 1688.68it/s]","\rparsing log, completed traces ::  24%|##3       | 3092/13087 [00:02<00:11, 845.22it/s] ","\rparsing log, completed traces ::  25%|##5       | 3308/13087 [00:02<00:09, 1071.87it/s]","\rparsing log, completed traces ::  27%|##6       | 3528/13087 [00:02<00:07, 1292.19it/s]","\rparsing log, completed traces ::  28%|##8       | 3716/13087 [00:02<00:06, 1419.37it/s]","\rparsing log, completed traces ::  30%|##9       | 3895/13087 [00:02<00:06, 1496.34it/s]","\rparsing log, completed traces ::  32%|###1      | 4142/13087 [00:03<00:05, 1742.16it/s]","\rparsing log, completed traces ::  33%|###3      | 4381/13087 [00:03<00:04, 1911.04it/s]","\rparsing log, completed traces ::  35%|###5      | 4600/13087 [00:03<00:04, 1984.66it/s]","\rparsing log, completed traces ::  37%|###6      | 4813/13087 [00:03<00:04, 1937.17it/s]","\rparsing log, completed traces ::  38%|###8      | 5021/13087 [00:03<00:04, 1975.62it/s]","\rparsing log, completed traces ::  40%|###9      | 5226/13087 [00:03<00:04, 1891.12it/s]","\rparsing log, completed traces ::  41%|####1     | 5421/13087 [00:03<00:04, 1869.95it/s]","\rparsing log, completed traces ::  43%|####2     | 5612/13087 [00:03<00:04, 1793.07it/s]","\rparsing log, completed traces ::  44%|####4     | 5795/13087 [00:03<00:04, 1782.39it/s]","\rparsing log, completed traces ::  46%|####5     | 5976/13087 [00:04<00:03, 1783.17it/s]","\rparsing log, completed traces ::  47%|####7     | 6156/13087 [00:04<00:03, 1734.66it/s]","\rparsing log, completed traces ::  49%|####8     | 6355/13087 [00:04<00:03, 1799.83it/s]","\rparsing log, completed traces ::  50%|####9     | 6537/13087 [00:04<00:07, 870.40it/s] ","\rparsing log, completed traces ::  51%|#####1    | 6697/13087 [00:04<00:06, 987.74it/s]","\rparsing log, completed traces ::  52%|#####2    | 6866/13087 [00:04<00:05, 1120.57it/s]","\rparsing log, completed traces ::  54%|#####3    | 7024/13087 [00:05<00:04, 1218.61it/s]","\rparsing log, completed traces ::  55%|#####4    | 7191/13087 [00:05<00:04, 1321.12it/s]","\rparsing log, completed traces ::  56%|#####6    | 7354/13087 [00:05<00:04, 1391.99it/s]","\rparsing log, completed traces ::  57%|#####7    | 7512/13087 [00:05<00:03, 1433.01it/s]","\rparsing log, completed traces ::  59%|#####8    | 7671/13087 [00:05<00:03, 1475.58it/s]","\rparsing log, completed traces ::  60%|######    | 7853/13087 [00:05<00:03, 1571.76it/s]","\rparsing log, completed traces ::  61%|######1   | 8018/13087 [00:05<00:03, 1520.25it/s]","\rparsing log, completed traces ::  63%|######2   | 8214/13087 [00:05<00:02, 1643.19it/s]","\rparsing log, completed traces ::  64%|######4   | 8387/13087 [00:05<00:02, 1666.68it/s]","\rparsing log, completed traces ::  66%|######5   | 8572/13087 [00:05<00:02, 1717.73it/s]","\rparsing log, completed traces ::  67%|######6   | 8749/13087 [00:06<00:02, 1729.01it/s]","\rparsing log, completed traces ::  68%|######8   | 8924/13087 [00:06<00:02, 1714.58it/s]","\rparsing log, completed traces ::  70%|######9   | 9097/13087 [00:06<00:02, 1692.68it/s]","\rparsing log, completed traces ::  71%|#######   | 9280/13087 [00:06<00:02, 1729.88it/s]","\rparsing log, completed traces ::  72%|#######2  | 9456/13087 [00:06<00:02, 1737.13it/s]","\rparsing log, completed traces ::  74%|#######3  | 9631/13087 [00:06<00:02, 1684.67it/s]","\rparsing log, completed traces ::  75%|#######4  | 9803/13087 [00:06<00:01, 1694.22it/s]","\rparsing log, completed traces ::  76%|#######6  | 9973/13087 [00:06<00:01, 1661.14it/s]","\rparsing log, completed traces ::  77%|#######7  | 10140/13087 [00:07<00:03, 743.57it/s]","\rparsing log, completed traces ::  79%|#######8  | 10287/13087 [00:07<00:03, 856.79it/s]","\rparsing log, completed traces ::  80%|#######9  | 10445/13087 [00:07<00:02, 986.28it/s]","\rparsing log, completed traces ::  81%|########  | 10592/13087 [00:07<00:02, 1085.92it/s]","\rparsing log, completed traces ::  82%|########2 | 10775/13087 [00:07<00:01, 1255.08it/s]","\rparsing log, completed traces ::  84%|########3 | 10967/13087 [00:07<00:01, 1413.69it/s]","\rparsing log, completed traces ::  85%|########5 | 11155/13087 [00:07<00:01, 1534.33it/s]","\rparsing log, completed traces ::  87%|########6 | 11340/13087 [00:08<00:01, 1617.72it/s]","\rparsing log, completed traces ::  88%|########8 | 11535/13087 [00:08<00:00, 1709.74it/s]","\rparsing log, completed traces ::  90%|########9 | 11727/13087 [00:08<00:00, 1769.40it/s]","\rparsing log, completed traces ::  91%|#########1| 11934/13087 [00:08<00:00, 1854.68it/s]","\rparsing log, completed traces ::  93%|#########2| 12126/13087 [00:08<00:00, 1862.42it/s]","\rparsing log, completed traces ::  94%|#########4| 12339/13087 [00:08<00:00, 1939.54it/s]","\rparsing log, completed traces ::  96%|#########5| 12539/13087 [00:08<00:00, 1955.82it/s]","\rparsing log, completed traces ::  97%|#########7| 12739/13087 [00:08<00:00, 1961.93it/s]","\rparsing log, completed traces ::  99%|#########8| 12946/13087 [00:08<00:00, 1992.93it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:08<00:00, 1472.48it/s]","\n","[data] Loaded BPI2012: BPI_Challenge_2012.xes, events=262200","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:29:31,  1.95it/s]","\rparsing log, completed traces ::   0%|          | 70/31509 [00:00<03:28, 150.69it/s]","\rparsing log, completed traces ::   0%|          | 131/31509 [00:00<02:01, 258.53it/s]","\rparsing log, completed traces ::   1%|          | 202/31509 [00:00<01:24, 371.61it/s]","\rparsing log, completed traces ::   1%|          | 264/31509 [00:00<01:11, 436.81it/s]","\rparsing log, completed traces ::   1%|1         | 331/31509 [00:01<01:02, 499.90it/s]","\rparsing log, completed traces ::   1%|1         | 396/31509 [00:01<00:57, 539.75it/s]","\rparsing log, completed traces ::   1%|1         | 459/31509 [00:01<00:55, 563.84it/s]","\rparsing log, completed traces ::   2%|1         | 522/31509 [00:01<01:40, 308.62it/s]","\rparsing log, completed traces ::   2%|1         | 582/31509 [00:01<01:25, 360.45it/s]","\rparsing log, completed traces ::   2%|2         | 640/31509 [00:01<01:16, 403.17it/s]","\rparsing log, completed traces ::   2%|2         | 693/31509 [00:01<01:13, 416.51it/s]","\rparsing log, completed traces ::   2%|2         | 757/31509 [00:02<01:05, 468.95it/s]","\rparsing log, completed traces ::   3%|2         | 817/31509 [00:02<01:01, 501.59it/s]","\rparsing log, completed traces ::   3%|2         | 880/31509 [00:02<00:57, 532.35it/s]","\rparsing log, completed traces ::   3%|2         | 938/31509 [00:02<01:02, 492.64it/s]","\rparsing log, completed traces ::   3%|3         | 1008/31509 [00:02<00:55, 545.96it/s]","\rparsing log, completed traces ::   3%|3         | 1067/31509 [00:02<00:54, 555.28it/s]","\rparsing log, completed traces ::   4%|3         | 1134/31509 [00:02<00:51, 585.12it/s]","\rparsing log, completed traces ::   4%|3         | 1207/31509 [00:02<00:48, 623.93it/s]","\rparsing log, completed traces ::   4%|4         | 1276/31509 [00:02<00:47, 637.98it/s]","\rparsing log, completed traces ::   4%|4         | 1346/31509 [00:02<00:46, 654.98it/s]","\rparsing log, completed traces ::   4%|4         | 1413/31509 [00:03<00:45, 656.04it/s]","\rparsing log, completed traces ::   5%|4         | 1480/31509 [00:03<00:45, 657.56it/s]","\rparsing log, completed traces ::   5%|4         | 1550/31509 [00:03<00:44, 669.83it/s]","\rparsing log, completed traces ::   5%|5         | 1618/31509 [00:03<00:44, 666.66it/s]","\rparsing log, completed traces ::   5%|5         | 1685/31509 [00:03<00:45, 656.85it/s]","\rparsing log, completed traces ::   6%|5         | 1751/31509 [00:03<01:29, 333.71it/s]","\rparsing log, completed traces ::   6%|5         | 1814/31509 [00:04<01:17, 385.15it/s]","\rparsing log, completed traces ::   6%|5         | 1875/31509 [00:04<01:08, 429.58it/s]","\rparsing log, completed traces ::   6%|6         | 1944/31509 [00:04<01:00, 485.73it/s]","\rparsing log, completed traces ::   6%|6         | 2012/31509 [00:04<00:55, 532.24it/s]","\rparsing log, completed traces ::   7%|6         | 2080/31509 [00:04<00:51, 568.61it/s]","\rparsing log, completed traces ::   7%|6         | 2150/31509 [00:04<00:48, 602.76it/s]","\rparsing log, completed traces ::   7%|7         | 2220/31509 [00:04<00:46, 628.16it/s]","\rparsing log, completed traces ::   7%|7         | 2294/31509 [00:04<00:44, 654.98it/s]","\rparsing log, completed traces ::   7%|7         | 2363/31509 [00:04<00:44, 657.97it/s]","\rparsing log, completed traces ::   8%|7         | 2434/31509 [00:04<00:43, 671.95it/s]","\rparsing log, completed traces ::   8%|7         | 2504/31509 [00:05<00:42, 678.75it/s]","\rparsing log, completed traces ::   8%|8         | 2577/31509 [00:05<00:41, 692.77it/s]","\rparsing log, completed traces ::   8%|8         | 2652/31509 [00:05<00:40, 708.55it/s]","\rparsing log, completed traces ::   9%|8         | 2724/31509 [00:05<00:41, 697.87it/s]","\rparsing log, completed traces ::   9%|8         | 2799/31509 [00:05<00:40, 709.73it/s]","\rparsing log, completed traces ::   9%|9         | 2877/31509 [00:05<00:39, 728.86it/s]","\rparsing log, completed traces ::   9%|9         | 2954/31509 [00:05<00:38, 739.48it/s]","\rparsing log, completed traces ::  10%|9         | 3029/31509 [00:05<00:38, 731.33it/s]","\rparsing log, completed traces ::  10%|9         | 3103/31509 [00:06<01:19, 355.68it/s]","\rparsing log, completed traces ::  10%|#         | 3174/31509 [00:06<01:08, 413.94it/s]","\rparsing log, completed traces ::  10%|#         | 3241/31509 [00:06<01:01, 463.16it/s]","\rparsing log, completed traces ::  11%|#         | 3322/31509 [00:06<00:52, 536.71it/s]","\rparsing log, completed traces ::  11%|#         | 3398/31509 [00:06<00:47, 589.09it/s]","\rparsing log, completed traces ::  11%|#1        | 3477/31509 [00:06<00:43, 639.63it/s]","\rparsing log, completed traces ::  11%|#1        | 3550/31509 [00:06<00:42, 658.87it/s]","\rparsing log, completed traces ::  12%|#1        | 3627/31509 [00:06<00:40, 685.77it/s]","\rparsing log, completed traces ::  12%|#1        | 3702/31509 [00:07<00:39, 701.69it/s]","\rparsing log, completed traces ::  12%|#1        | 3776/31509 [00:07<00:39, 709.50it/s]","\rparsing log, completed traces ::  12%|#2        | 3850/31509 [00:07<00:39, 703.61it/s]","\rparsing log, completed traces ::  12%|#2        | 3924/31509 [00:07<00:38, 707.56it/s]","\rparsing log, completed traces ::  13%|#2        | 4004/31509 [00:07<00:37, 730.23it/s]","\rparsing log, completed traces ::  13%|#2        | 4078/31509 [00:07<00:37, 727.41it/s]","\rparsing log, completed traces ::  13%|#3        | 4152/31509 [00:07<00:37, 725.03it/s]","\rparsing log, completed traces ::  13%|#3        | 4225/31509 [00:07<00:38, 706.32it/s]","\rparsing log, completed traces ::  14%|#3        | 4297/31509 [00:07<00:39, 695.29it/s]","\rparsing log, completed traces ::  14%|#3        | 4367/31509 [00:07<00:38, 696.53it/s]","\rparsing log, completed traces ::  14%|#4        | 4440/31509 [00:08<00:38, 702.38it/s]","\rparsing log, completed traces ::  14%|#4        | 4511/31509 [00:08<00:38, 702.24it/s]","\rparsing log, completed traces ::  15%|#4        | 4582/31509 [00:08<00:38, 703.57it/s]","\rparsing log, completed traces ::  15%|#4        | 4653/31509 [00:08<01:23, 320.25it/s]","\rparsing log, completed traces ::  15%|#5        | 4732/31509 [00:08<01:07, 395.34it/s]","\rparsing log, completed traces ::  15%|#5        | 4803/31509 [00:08<00:58, 453.10it/s]","\rparsing log, completed traces ::  15%|#5        | 4877/31509 [00:09<00:52, 511.79it/s]","\rparsing log, completed traces ::  16%|#5        | 4948/31509 [00:09<00:47, 557.42it/s]","\rparsing log, completed traces ::  16%|#5        | 5022/31509 [00:09<00:44, 601.08it/s]","\rparsing log, completed traces ::  16%|#6        | 5101/31509 [00:09<00:40, 650.10it/s]","\rparsing log, completed traces ::  16%|#6        | 5174/31509 [00:09<00:39, 662.01it/s]","\rparsing log, completed traces ::  17%|#6        | 5250/31509 [00:09<00:38, 688.82it/s]","\rparsing log, completed traces ::  17%|#6        | 5323/31509 [00:09<00:37, 696.84it/s]","\rparsing log, completed traces ::  17%|#7        | 5396/31509 [00:09<00:37, 700.07it/s]","\rparsing log, completed traces ::  17%|#7        | 5470/31509 [00:09<00:36, 711.49it/s]","\rparsing log, completed traces ::  18%|#7        | 5546/31509 [00:10<00:35, 724.69it/s]","\rparsing log, completed traces ::  18%|#7        | 5622/31509 [00:10<00:35, 734.76it/s]","\rparsing log, completed traces ::  18%|#8        | 5703/31509 [00:10<00:34, 755.09it/s]","\rparsing log, completed traces ::  18%|#8        | 5781/31509 [00:10<00:33, 759.20it/s]","\rparsing log, completed traces ::  19%|#8        | 5858/31509 [00:10<00:33, 759.66it/s]","\rparsing log, completed traces ::  19%|#8        | 5938/31509 [00:10<00:33, 770.86it/s]","\rparsing log, completed traces ::  19%|#9        | 6016/31509 [00:10<00:33, 760.36it/s]","\rparsing log, completed traces ::  19%|#9        | 6093/31509 [00:10<00:34, 740.47it/s]","\rparsing log, completed traces ::  20%|#9        | 6170/31509 [00:10<00:33, 746.88it/s]","\rparsing log, completed traces ::  20%|#9        | 6246/31509 [00:10<00:33, 747.23it/s]","\rparsing log, completed traces ::  20%|##        | 6321/31509 [00:11<00:34, 733.99it/s]","\rparsing log, completed traces ::  20%|##        | 6395/31509 [00:11<00:34, 733.39it/s]","\rparsing log, completed traces ::  21%|##        | 6469/31509 [00:11<01:19, 314.19it/s]","\rparsing log, completed traces ::  21%|##        | 6533/31509 [00:11<01:08, 363.63it/s]","\rparsing log, completed traces ::  21%|##        | 6598/31509 [00:11<01:00, 413.89it/s]","\rparsing log, completed traces ::  21%|##1       | 6669/31509 [00:11<00:52, 473.78it/s]","\rparsing log, completed traces ::  21%|##1       | 6745/31509 [00:12<00:46, 536.92it/s]","\rparsing log, completed traces ::  22%|##1       | 6817/31509 [00:12<00:42, 580.54it/s]","\rparsing log, completed traces ::  22%|##1       | 6887/31509 [00:12<00:40, 608.13it/s]","\rparsing log, completed traces ::  22%|##2       | 6961/31509 [00:12<00:38, 641.37it/s]","\rparsing log, completed traces ::  22%|##2       | 7042/31509 [00:12<00:35, 687.12it/s]","\rparsing log, completed traces ::  23%|##2       | 7120/31509 [00:12<00:34, 711.64it/s]","\rparsing log, completed traces ::  23%|##2       | 7195/31509 [00:12<00:34, 696.20it/s]","\rparsing log, completed traces ::  23%|##3       | 7267/31509 [00:12<00:34, 702.03it/s]","\rparsing log, completed traces ::  23%|##3       | 7339/31509 [00:12<00:34, 696.83it/s]","\rparsing log, completed traces ::  24%|##3       | 7410/31509 [00:13<00:34, 699.50it/s]","\rparsing log, completed traces ::  24%|##3       | 7486/31509 [00:13<00:33, 712.06it/s]","\rparsing log, completed traces ::  24%|##4       | 7566/31509 [00:13<00:32, 735.14it/s]","\rparsing log, completed traces ::  24%|##4       | 7640/31509 [00:13<00:33, 715.19it/s]","\rparsing log, completed traces ::  24%|##4       | 7712/31509 [00:13<00:33, 711.09it/s]","\rparsing log, completed traces ::  25%|##4       | 7784/31509 [00:13<00:34, 693.59it/s]","\rparsing log, completed traces ::  25%|##4       | 7860/31509 [00:13<00:33, 711.88it/s]","\rparsing log, completed traces ::  25%|##5       | 7934/31509 [00:13<00:32, 717.15it/s]","\rparsing log, completed traces ::  25%|##5       | 8008/31509 [00:13<00:32, 723.46it/s]","\rparsing log, completed traces ::  26%|##5       | 8081/31509 [00:13<00:32, 719.61it/s]","\rparsing log, completed traces ::  26%|##5       | 8154/31509 [00:14<00:32, 719.46it/s]","\rparsing log, completed traces ::  26%|##6       | 8233/31509 [00:14<00:31, 738.63it/s]","\rparsing log, completed traces ::  26%|##6       | 8307/31509 [00:14<00:31, 731.82it/s]","\rparsing log, completed traces ::  27%|##6       | 8381/31509 [00:14<01:17, 297.83it/s]","\rparsing log, completed traces ::  27%|##6       | 8452/31509 [00:14<01:04, 357.94it/s]","\rparsing log, completed traces ::  27%|##7       | 8523/31509 [00:15<00:54, 418.53it/s]","\rparsing log, completed traces ::  27%|##7       | 8591/31509 [00:15<00:48, 470.16it/s]","\rparsing log, completed traces ::  27%|##7       | 8661/31509 [00:15<00:44, 517.53it/s]","\rparsing log, completed traces ::  28%|##7       | 8734/31509 [00:15<00:40, 567.39it/s]","\rparsing log, completed traces ::  28%|##7       | 8808/31509 [00:15<00:37, 609.83it/s]","\rparsing log, completed traces ::  28%|##8       | 8878/31509 [00:15<00:36, 625.14it/s]","\rparsing log, completed traces ::  28%|##8       | 8951/31509 [00:15<00:34, 651.58it/s]","\rparsing log, completed traces ::  29%|##8       | 9021/31509 [00:15<00:35, 641.64it/s]","\rparsing log, completed traces ::  29%|##8       | 9091/31509 [00:15<00:34, 655.53it/s]","\rparsing log, completed traces ::  29%|##9       | 9162/31509 [00:15<00:33, 670.14it/s]","\rparsing log, completed traces ::  29%|##9       | 9231/31509 [00:16<00:33, 663.47it/s]","\rparsing log, completed traces ::  30%|##9       | 9299/31509 [00:16<00:33, 667.52it/s]","\rparsing log, completed traces ::  30%|##9       | 9372/31509 [00:16<00:32, 685.19it/s]","\rparsing log, completed traces ::  30%|##9       | 9442/31509 [00:16<00:32, 682.53it/s]","\rparsing log, completed traces ::  30%|###       | 9513/31509 [00:16<00:31, 688.14it/s]","\rparsing log, completed traces ::  30%|###       | 9583/31509 [00:16<00:32, 684.43it/s]","\rparsing log, completed traces ::  31%|###       | 9656/31509 [00:16<00:31, 695.39it/s]","\rparsing log, completed traces ::  31%|###       | 9726/31509 [00:16<00:32, 671.66it/s]","\rparsing log, completed traces ::  31%|###1      | 9796/31509 [00:16<00:31, 679.24it/s]","\rparsing log, completed traces ::  31%|###1      | 9865/31509 [00:17<00:32, 674.38it/s]","\rparsing log, completed traces ::  32%|###1      | 9933/31509 [00:17<00:32, 673.54it/s]","\rparsing log, completed traces ::  32%|###1      | 10001/31509 [00:17<00:32, 663.58it/s]","\rparsing log, completed traces ::  32%|###1      | 10068/31509 [00:17<00:32, 663.51it/s]","\rparsing log, completed traces ::  32%|###2      | 10135/31509 [00:17<00:32, 648.46it/s]","\rparsing log, completed traces ::  32%|###2      | 10206/31509 [00:17<00:31, 666.29it/s]","\rparsing log, completed traces ::  33%|###2      | 10278/31509 [00:17<00:31, 681.75it/s]","\rparsing log, completed traces ::  33%|###2      | 10347/31509 [00:17<00:32, 658.60it/s]","\rparsing log, completed traces ::  33%|###3      | 10414/31509 [00:17<00:32, 657.89it/s]","\rparsing log, completed traces ::  33%|###3      | 10480/31509 [00:18<01:25, 245.99it/s]","\rparsing log, completed traces ::  33%|###3      | 10543/31509 [00:18<01:10, 297.54it/s]","\rparsing log, completed traces ::  34%|###3      | 10612/31509 [00:18<00:58, 359.78it/s]","\rparsing log, completed traces ::  34%|###3      | 10680/31509 [00:18<00:49, 419.33it/s]","\rparsing log, completed traces ::  34%|###4      | 10745/31509 [00:18<00:44, 466.72it/s]","\rparsing log, completed traces ::  34%|###4      | 10807/31509 [00:19<00:41, 497.92it/s]","\rparsing log, completed traces ::  34%|###4      | 10869/31509 [00:19<00:39, 520.18it/s]","\rparsing log, completed traces ::  35%|###4      | 10933/31509 [00:19<00:37, 550.88it/s]","\rparsing log, completed traces ::  35%|###4      | 11000/31509 [00:19<00:35, 580.73it/s]","\rparsing log, completed traces ::  35%|###5      | 11069/31509 [00:19<00:33, 610.94it/s]","\rparsing log, completed traces ::  35%|###5      | 11140/31509 [00:19<00:31, 638.56it/s]","\rparsing log, completed traces ::  36%|###5      | 11207/31509 [00:19<00:31, 641.15it/s]","\rparsing log, completed traces ::  36%|###5      | 11282/31509 [00:19<00:30, 668.90it/s]","\rparsing log, completed traces ::  36%|###6      | 11351/31509 [00:19<00:30, 666.31it/s]","\rparsing log, completed traces ::  36%|###6      | 11419/31509 [00:19<00:30, 658.52it/s]","\rparsing log, completed traces ::  36%|###6      | 11488/31509 [00:20<00:30, 664.96it/s]","\rparsing log, completed traces ::  37%|###6      | 11555/31509 [00:20<00:30, 652.59it/s]","\rparsing log, completed traces ::  37%|###6      | 11622/31509 [00:20<00:30, 654.68it/s]","\rparsing log, completed traces ::  37%|###7      | 11689/31509 [00:20<00:30, 658.26it/s]","\rparsing log, completed traces ::  37%|###7      | 11759/31509 [00:20<00:29, 667.85it/s]","\rparsing log, completed traces ::  38%|###7      | 11831/31509 [00:20<00:28, 680.48it/s]","\rparsing log, completed traces ::  38%|###7      | 11906/31509 [00:20<00:27, 700.29it/s]","\rparsing log, completed traces ::  38%|###8      | 11979/31509 [00:20<00:27, 707.88it/s]","\rparsing log, completed traces ::  38%|###8      | 12050/31509 [00:20<00:27, 706.13it/s]","\rparsing log, completed traces ::  38%|###8      | 12121/31509 [00:20<00:27, 694.71it/s]","\rparsing log, completed traces ::  39%|###8      | 12191/31509 [00:21<00:27, 691.38it/s]","\rparsing log, completed traces ::  39%|###8      | 12262/31509 [00:21<00:27, 696.00it/s]","\rparsing log, completed traces ::  39%|###9      | 12334/31509 [00:21<00:27, 703.06it/s]","\rparsing log, completed traces ::  39%|###9      | 12405/31509 [00:21<00:27, 697.08it/s]","\rparsing log, completed traces ::  40%|###9      | 12477/31509 [00:21<00:27, 700.33it/s]","\rparsing log, completed traces ::  40%|###9      | 12548/31509 [00:21<00:27, 684.63it/s]","\rparsing log, completed traces ::  40%|####      | 12619/31509 [00:21<00:27, 691.24it/s]","\rparsing log, completed traces ::  40%|####      | 12689/31509 [00:21<00:27, 693.67it/s]","\rparsing log, completed traces ::  40%|####      | 12761/31509 [00:21<00:26, 699.03it/s]","\rparsing log, completed traces ::  41%|####      | 12831/31509 [00:22<01:17, 241.46it/s]","\rparsing log, completed traces ::  41%|####      | 12899/31509 [00:22<01:02, 297.33it/s]","\rparsing log, completed traces ::  41%|####1     | 12968/31509 [00:22<00:51, 357.22it/s]","\rparsing log, completed traces ::  41%|####1     | 13040/31509 [00:22<00:43, 421.86it/s]","\rparsing log, completed traces ::  42%|####1     | 13118/31509 [00:23<00:37, 494.98it/s]","\rparsing log, completed traces ::  42%|####1     | 13186/31509 [00:23<00:34, 531.47it/s]","\rparsing log, completed traces ::  42%|####2     | 13255/31509 [00:23<00:32, 569.20it/s]","\rparsing log, completed traces ::  42%|####2     | 13325/31509 [00:23<00:30, 600.09it/s]","\rparsing log, completed traces ::  43%|####2     | 13397/31509 [00:23<00:28, 630.04it/s]","\rparsing log, completed traces ::  43%|####2     | 13466/31509 [00:23<00:28, 641.16it/s]","\rparsing log, completed traces ::  43%|####2     | 13537/31509 [00:23<00:27, 657.36it/s]","\rparsing log, completed traces ::  43%|####3     | 13606/31509 [00:23<00:26, 663.72it/s]","\rparsing log, completed traces ::  43%|####3     | 13675/31509 [00:23<00:27, 653.78it/s]","\rparsing log, completed traces ::  44%|####3     | 13747/31509 [00:23<00:26, 671.62it/s]","\rparsing log, completed traces ::  44%|####3     | 13816/31509 [00:24<00:26, 675.27it/s]","\rparsing log, completed traces ::  44%|####4     | 13885/31509 [00:24<00:26, 672.15it/s]","\rparsing log, completed traces ::  44%|####4     | 13958/31509 [00:24<00:25, 687.00it/s]","\rparsing log, completed traces ::  45%|####4     | 14030/31509 [00:24<00:25, 693.90it/s]","\rparsing log, completed traces ::  45%|####4     | 14100/31509 [00:24<00:25, 689.79it/s]","\rparsing log, completed traces ::  45%|####4     | 14175/31509 [00:24<00:24, 706.49it/s]","\rparsing log, completed traces ::  45%|####5     | 14246/31509 [00:24<00:24, 704.35it/s]","\rparsing log, completed traces ::  45%|####5     | 14319/31509 [00:24<00:24, 706.66it/s]","\rparsing log, completed traces ::  46%|####5     | 14397/31509 [00:24<00:23, 724.56it/s]","\rparsing log, completed traces ::  46%|####5     | 14470/31509 [00:24<00:23, 719.82it/s]","\rparsing log, completed traces ::  46%|####6     | 14543/31509 [00:25<00:24, 693.25it/s]","\rparsing log, completed traces ::  46%|####6     | 14613/31509 [00:25<00:24, 686.88it/s]","\rparsing log, completed traces ::  47%|####6     | 14683/31509 [00:25<00:24, 689.73it/s]","\rparsing log, completed traces ::  47%|####6     | 14754/31509 [00:25<00:24, 695.60it/s]","\rparsing log, completed traces ::  47%|####7     | 14828/31509 [00:25<00:23, 706.37it/s]","\rparsing log, completed traces ::  47%|####7     | 14899/31509 [00:25<00:23, 703.53it/s]","\rparsing log, completed traces ::  48%|####7     | 14975/31509 [00:25<00:22, 719.97it/s]","\rparsing log, completed traces ::  48%|####7     | 15048/31509 [00:25<00:22, 720.51it/s]","\rparsing log, completed traces ::  48%|####7     | 15121/31509 [00:25<00:22, 723.05it/s]","\rparsing log, completed traces ::  48%|####8     | 15198/31509 [00:26<00:22, 733.19it/s]","\rparsing log, completed traces ::  48%|####8     | 15272/31509 [00:26<00:22, 734.81it/s]","\rparsing log, completed traces ::  49%|####8     | 15350/31509 [00:26<00:21, 748.27it/s]","\rparsing log, completed traces ::  49%|####8     | 15426/31509 [00:26<00:21, 746.73it/s]","\rparsing log, completed traces ::  49%|####9     | 15501/31509 [00:26<00:21, 747.34it/s]","\rparsing log, completed traces ::  49%|####9     | 15576/31509 [00:27<01:04, 247.43it/s]","\rparsing log, completed traces ::  50%|####9     | 15650/31509 [00:27<00:51, 308.14it/s]","\rparsing log, completed traces ::  50%|####9     | 15724/31509 [00:27<00:42, 372.18it/s]","\rparsing log, completed traces ::  50%|#####     | 15796/31509 [00:27<00:36, 432.30it/s]","\rparsing log, completed traces ::  50%|#####     | 15872/31509 [00:27<00:31, 497.57it/s]","\rparsing log, completed traces ::  51%|#####     | 15946/31509 [00:27<00:28, 551.04it/s]","\rparsing log, completed traces ::  51%|#####     | 16017/31509 [00:27<00:26, 588.44it/s]","\rparsing log, completed traces ::  51%|#####1    | 16095/31509 [00:27<00:24, 637.04it/s]","\rparsing log, completed traces ::  51%|#####1    | 16176/31509 [00:27<00:22, 681.26it/s]","\rparsing log, completed traces ::  52%|#####1    | 16251/31509 [00:28<00:21, 694.81it/s]","\rparsing log, completed traces ::  52%|#####1    | 16328/31509 [00:28<00:21, 713.79it/s]","\rparsing log, completed traces ::  52%|#####2    | 16403/31509 [00:28<00:21, 691.64it/s]","\rparsing log, completed traces ::  52%|#####2    | 16475/31509 [00:28<00:21, 693.67it/s]","\rparsing log, completed traces ::  53%|#####2    | 16547/31509 [00:28<00:21, 693.79it/s]","\rparsing log, completed traces ::  53%|#####2    | 16621/31509 [00:28<00:21, 705.48it/s]","\rparsing log, completed traces ::  53%|#####2    | 16699/31509 [00:28<00:20, 727.09it/s]","\rparsing log, completed traces ::  53%|#####3    | 16773/31509 [00:28<00:20, 719.40it/s]","\rparsing log, completed traces ::  53%|#####3    | 16847/31509 [00:28<00:20, 722.59it/s]","\rparsing log, completed traces ::  54%|#####3    | 16925/31509 [00:29<00:19, 738.50it/s]","\rparsing log, completed traces ::  54%|#####3    | 17000/31509 [00:29<00:19, 735.96it/s]","\rparsing log, completed traces ::  54%|#####4    | 17084/31509 [00:29<00:18, 765.06it/s]","\rparsing log, completed traces ::  54%|#####4    | 17161/31509 [00:29<00:18, 755.74it/s]","\rparsing log, completed traces ::  55%|#####4    | 17237/31509 [00:29<00:19, 737.79it/s]","\rparsing log, completed traces ::  55%|#####4    | 17312/31509 [00:29<00:19, 740.96it/s]","\rparsing log, completed traces ::  55%|#####5    | 17387/31509 [00:29<00:19, 733.65it/s]","\rparsing log, completed traces ::  55%|#####5    | 17467/31509 [00:29<00:18, 751.80it/s]","\rparsing log, completed traces ::  56%|#####5    | 17543/31509 [00:29<00:19, 727.60it/s]","\rparsing log, completed traces ::  56%|#####5    | 17623/31509 [00:29<00:18, 747.92it/s]","\rparsing log, completed traces ::  56%|#####6    | 17699/31509 [00:30<00:18, 750.57it/s]","\rparsing log, completed traces ::  56%|#####6    | 17775/31509 [00:30<00:18, 751.04it/s]","\rparsing log, completed traces ::  57%|#####6    | 17855/31509 [00:30<00:17, 761.08it/s]","\rparsing log, completed traces ::  57%|#####6    | 17932/31509 [00:30<00:18, 754.06it/s]","\rparsing log, completed traces ::  57%|#####7    | 18010/31509 [00:30<00:17, 758.72it/s]","\rparsing log, completed traces ::  57%|#####7    | 18089/31509 [00:30<00:17, 765.65it/s]","\rparsing log, completed traces ::  58%|#####7    | 18166/31509 [00:30<00:17, 765.98it/s]","\rparsing log, completed traces ::  58%|#####7    | 18243/31509 [00:30<00:17, 754.90it/s]","\rparsing log, completed traces ::  58%|#####8    | 18319/31509 [00:30<00:17, 735.20it/s]","\rparsing log, completed traces ::  58%|#####8    | 18399/31509 [00:30<00:17, 751.48it/s]","\rparsing log, completed traces ::  59%|#####8    | 18475/31509 [00:31<00:17, 737.62it/s]","\rparsing log, completed traces ::  59%|#####8    | 18549/31509 [00:31<00:17, 722.08it/s]","\rparsing log, completed traces ::  59%|#####9    | 18622/31509 [00:31<00:17, 718.19it/s]","\rparsing log, completed traces ::  59%|#####9    | 18708/31509 [00:31<00:16, 758.67it/s]","\rparsing log, completed traces ::  60%|#####9    | 18785/31509 [00:32<00:54, 231.90it/s]","\rparsing log, completed traces ::  60%|#####9    | 18859/31509 [00:32<00:43, 289.25it/s]","\rparsing log, completed traces ::  60%|######    | 18942/31509 [00:32<00:34, 364.03it/s]","\rparsing log, completed traces ::  60%|######    | 19016/31509 [00:32<00:29, 424.89it/s]","\rparsing log, completed traces ::  61%|######    | 19093/31509 [00:32<00:25, 490.28it/s]","\rparsing log, completed traces ::  61%|######    | 19171/31509 [00:32<00:22, 551.07it/s]","\rparsing log, completed traces ::  61%|######1   | 19245/31509 [00:32<00:20, 589.08it/s]","\rparsing log, completed traces ::  61%|######1   | 19319/31509 [00:32<00:19, 623.92it/s]","\rparsing log, completed traces ::  62%|######1   | 19399/31509 [00:33<00:18, 667.99it/s]","\rparsing log, completed traces ::  62%|######1   | 19474/31509 [00:33<00:17, 688.25it/s]","\rparsing log, completed traces ::  62%|######2   | 19551/31509 [00:33<00:16, 710.89it/s]","\rparsing log, completed traces ::  62%|######2   | 19627/31509 [00:33<00:16, 707.52it/s]","\rparsing log, completed traces ::  63%|######2   | 19701/31509 [00:33<00:16, 705.76it/s]","\rparsing log, completed traces ::  63%|######2   | 19774/31509 [00:33<00:16, 712.10it/s]","\rparsing log, completed traces ::  63%|######2   | 19847/31509 [00:33<00:16, 701.53it/s]","\rparsing log, completed traces ::  63%|######3   | 19921/31509 [00:33<00:16, 711.49it/s]","\rparsing log, completed traces ::  63%|######3   | 19993/31509 [00:33<00:16, 705.64it/s]","\rparsing log, completed traces ::  64%|######3   | 20065/31509 [00:34<00:16, 708.60it/s]","\rparsing log, completed traces ::  64%|######3   | 20140/31509 [00:34<00:15, 720.65it/s]","\rparsing log, completed traces ::  64%|######4   | 20217/31509 [00:34<00:15, 734.94it/s]","\rparsing log, completed traces ::  64%|######4   | 20296/31509 [00:34<00:14, 748.63it/s]","\rparsing log, completed traces ::  65%|######4   | 20372/31509 [00:34<00:15, 729.61it/s]","\rparsing log, completed traces ::  65%|######4   | 20458/31509 [00:34<00:14, 764.30it/s]","\rparsing log, completed traces ::  65%|######5   | 20535/31509 [00:34<00:14, 763.01it/s]","\rparsing log, completed traces ::  65%|######5   | 20612/31509 [00:34<00:14, 764.08it/s]","\rparsing log, completed traces ::  66%|######5   | 20693/31509 [00:34<00:13, 776.29it/s]","\rparsing log, completed traces ::  66%|######5   | 20772/31509 [00:34<00:13, 776.62it/s]","\rparsing log, completed traces ::  66%|######6   | 20850/31509 [00:35<00:14, 758.15it/s]","\rparsing log, completed traces ::  66%|######6   | 20926/31509 [00:35<00:14, 748.02it/s]","\rparsing log, completed traces ::  67%|######6   | 21001/31509 [00:35<00:14, 739.99it/s]","\rparsing log, completed traces ::  67%|######6   | 21076/31509 [00:35<00:14, 731.80it/s]","\rparsing log, completed traces ::  67%|######7   | 21150/31509 [00:35<00:14, 725.18it/s]","\rparsing log, completed traces ::  67%|######7   | 21229/31509 [00:35<00:13, 742.42it/s]","\rparsing log, completed traces ::  68%|######7   | 21304/31509 [00:35<00:13, 739.17it/s]","\rparsing log, completed traces ::  68%|######7   | 21378/31509 [00:35<00:13, 730.74it/s]","\rparsing log, completed traces ::  68%|######8   | 21460/31509 [00:35<00:13, 756.49it/s]","\rparsing log, completed traces ::  68%|######8   | 21539/31509 [00:35<00:13, 764.53it/s]","\rparsing log, completed traces ::  69%|######8   | 21616/31509 [00:36<00:13, 760.42it/s]","\rparsing log, completed traces ::  69%|######8   | 21693/31509 [00:36<00:13, 746.19it/s]","\rparsing log, completed traces ::  69%|######9   | 21775/31509 [00:36<00:12, 767.58it/s]","\rparsing log, completed traces ::  69%|######9   | 21854/31509 [00:36<00:12, 772.41it/s]","\rparsing log, completed traces ::  70%|######9   | 21935/31509 [00:36<00:12, 782.70it/s]","\rparsing log, completed traces ::  70%|######9   | 22014/31509 [00:36<00:12, 772.50it/s]","\rparsing log, completed traces ::  70%|#######   | 22094/31509 [00:36<00:12, 779.83it/s]","\rparsing log, completed traces ::  70%|#######   | 22176/31509 [00:36<00:11, 787.00it/s]","\rparsing log, completed traces ::  71%|#######   | 22255/31509 [00:36<00:12, 766.91it/s]","\rparsing log, completed traces ::  71%|#######   | 22334/31509 [00:37<00:11, 771.03it/s]","\rparsing log, completed traces ::  71%|#######1  | 22412/31509 [00:37<00:11, 770.25it/s]","\rparsing log, completed traces ::  71%|#######1  | 22490/31509 [00:38<00:41, 216.83it/s]","\rparsing log, completed traces ::  72%|#######1  | 22563/31509 [00:38<00:33, 270.73it/s]","\rparsing log, completed traces ::  72%|#######1  | 22639/31509 [00:38<00:26, 334.35it/s]","\rparsing log, completed traces ::  72%|#######2  | 22715/31509 [00:38<00:21, 400.69it/s]","\rparsing log, completed traces ::  72%|#######2  | 22794/31509 [00:38<00:18, 471.33it/s]","\rparsing log, completed traces ::  73%|#######2  | 22872/31509 [00:38<00:16, 532.73it/s]","\rparsing log, completed traces ::  73%|#######2  | 22945/31509 [00:38<00:14, 571.67it/s]","\rparsing log, completed traces ::  73%|#######3  | 23018/31509 [00:38<00:13, 608.65it/s]","\rparsing log, completed traces ::  73%|#######3  | 23091/31509 [00:38<00:13, 638.06it/s]","\rparsing log, completed traces ::  74%|#######3  | 23164/31509 [00:38<00:12, 659.33it/s]","\rparsing log, completed traces ::  74%|#######3  | 23238/31509 [00:39<00:12, 680.45it/s]","\rparsing log, completed traces ::  74%|#######3  | 23311/31509 [00:39<00:11, 691.50it/s]","\rparsing log, completed traces ::  74%|#######4  | 23384/31509 [00:39<00:11, 693.87it/s]","\rparsing log, completed traces ::  74%|#######4  | 23458/31509 [00:39<00:11, 702.68it/s]","\rparsing log, completed traces ::  75%|#######4  | 23532/31509 [00:39<00:11, 712.34it/s]","\rparsing log, completed traces ::  75%|#######4  | 23609/31509 [00:39<00:10, 726.58it/s]","\rparsing log, completed traces ::  75%|#######5  | 23684/31509 [00:39<00:10, 733.27it/s]","\rparsing log, completed traces ::  75%|#######5  | 23760/31509 [00:39<00:10, 740.20it/s]","\rparsing log, completed traces ::  76%|#######5  | 23835/31509 [00:39<00:10, 733.77it/s]","\rparsing log, completed traces ::  76%|#######5  | 23910/31509 [00:40<00:10, 738.16it/s]","\rparsing log, completed traces ::  76%|#######6  | 23985/31509 [00:40<00:10, 739.59it/s]","\rparsing log, completed traces ::  76%|#######6  | 24060/31509 [00:40<00:10, 729.11it/s]","\rparsing log, completed traces ::  77%|#######6  | 24135/31509 [00:40<00:10, 732.83it/s]","\rparsing log, completed traces ::  77%|#######6  | 24209/31509 [00:40<00:10, 727.78it/s]","\rparsing log, completed traces ::  77%|#######7  | 24283/31509 [00:40<00:09, 730.53it/s]","\rparsing log, completed traces ::  77%|#######7  | 24361/31509 [00:40<00:09, 743.56it/s]","\rparsing log, completed traces ::  78%|#######7  | 24436/31509 [00:40<00:09, 726.93it/s]","\rparsing log, completed traces ::  78%|#######7  | 24514/31509 [00:40<00:09, 741.99it/s]","\rparsing log, completed traces ::  78%|#######8  | 24591/31509 [00:40<00:09, 748.14it/s]","\rparsing log, completed traces ::  78%|#######8  | 24670/31509 [00:41<00:08, 760.49it/s]","\rparsing log, completed traces ::  79%|#######8  | 24747/31509 [00:41<00:08, 756.72it/s]","\rparsing log, completed traces ::  79%|#######8  | 24823/31509 [00:41<00:08, 755.53it/s]","\rparsing log, completed traces ::  79%|#######9  | 24901/31509 [00:41<00:08, 760.23it/s]","\rparsing log, completed traces ::  79%|#######9  | 24981/31509 [00:41<00:08, 771.38it/s]","\rparsing log, completed traces ::  80%|#######9  | 25059/31509 [00:41<00:08, 749.31it/s]","\rparsing log, completed traces ::  80%|#######9  | 25135/31509 [00:41<00:08, 747.39it/s]","\rparsing log, completed traces ::  80%|########  | 25212/31509 [00:41<00:08, 751.89it/s]","\rparsing log, completed traces ::  80%|########  | 25288/31509 [00:41<00:08, 726.28it/s]","\rparsing log, completed traces ::  80%|########  | 25361/31509 [00:41<00:08, 726.76it/s]","\rparsing log, completed traces ::  81%|########  | 25435/31509 [00:42<00:08, 730.27it/s]","\rparsing log, completed traces ::  81%|########  | 25511/31509 [00:42<00:08, 737.67it/s]","\rparsing log, completed traces ::  81%|########1 | 25590/31509 [00:42<00:07, 749.24it/s]","\rparsing log, completed traces ::  81%|########1 | 25665/31509 [00:42<00:07, 733.35it/s]","\rparsing log, completed traces ::  82%|########1 | 25739/31509 [00:42<00:07, 731.98it/s]","\rparsing log, completed traces ::  82%|########1 | 25813/31509 [00:42<00:07, 721.11it/s]","\rparsing log, completed traces ::  82%|########2 | 25886/31509 [00:42<00:07, 722.83it/s]","\rparsing log, completed traces ::  82%|########2 | 25959/31509 [00:42<00:07, 720.07it/s]","\rparsing log, completed traces ::  83%|########2 | 26032/31509 [00:42<00:07, 713.14it/s]","\rparsing log, completed traces ::  83%|########2 | 26104/31509 [00:42<00:07, 707.94it/s]","\rparsing log, completed traces ::  83%|########3 | 26180/31509 [00:43<00:07, 722.23it/s]","\rparsing log, completed traces ::  83%|########3 | 26253/31509 [00:43<00:07, 719.38it/s]","\rparsing log, completed traces ::  84%|########3 | 26328/31509 [00:43<00:07, 726.18it/s]","\rparsing log, completed traces ::  84%|########3 | 26404/31509 [00:43<00:06, 735.48it/s]","\rparsing log, completed traces ::  84%|########4 | 26478/31509 [00:44<00:26, 189.00it/s]","\rparsing log, completed traces ::  84%|########4 | 26544/31509 [00:44<00:21, 235.00it/s]","\rparsing log, completed traces ::  84%|########4 | 26612/31509 [00:44<00:16, 289.59it/s]","\rparsing log, completed traces ::  85%|########4 | 26686/31509 [00:44<00:13, 356.51it/s]","\rparsing log, completed traces ::  85%|########4 | 26761/31509 [00:44<00:11, 425.59it/s]","\rparsing log, completed traces ::  85%|########5 | 26835/31509 [00:44<00:09, 487.60it/s]","\rparsing log, completed traces ::  85%|########5 | 26905/31509 [00:45<00:08, 533.42it/s]","\rparsing log, completed traces ::  86%|########5 | 26975/31509 [00:45<00:07, 571.51it/s]","\rparsing log, completed traces ::  86%|########5 | 27045/31509 [00:45<00:07, 598.39it/s]","\rparsing log, completed traces ::  86%|########6 | 27117/31509 [00:45<00:06, 629.87it/s]","\rparsing log, completed traces ::  86%|########6 | 27191/31509 [00:45<00:06, 656.40it/s]","\rparsing log, completed traces ::  87%|########6 | 27269/31509 [00:45<00:06, 689.44it/s]","\rparsing log, completed traces ::  87%|########6 | 27342/31509 [00:45<00:06, 679.29it/s]","\rparsing log, completed traces ::  87%|########7 | 27416/31509 [00:45<00:05, 695.95it/s]","\rparsing log, completed traces ::  87%|########7 | 27488/31509 [00:45<00:05, 701.95it/s]","\rparsing log, completed traces ::  87%|########7 | 27562/31509 [00:46<00:05, 711.74it/s]","\rparsing log, completed traces ::  88%|########7 | 27635/31509 [00:46<00:05, 716.90it/s]","\rparsing log, completed traces ::  88%|########7 | 27712/31509 [00:46<00:05, 731.78it/s]","\rparsing log, completed traces ::  88%|########8 | 27788/31509 [00:46<00:05, 739.38it/s]","\rparsing log, completed traces ::  88%|########8 | 27863/31509 [00:46<00:05, 720.80it/s]","\rparsing log, completed traces ::  89%|########8 | 27936/31509 [00:46<00:04, 723.25it/s]","\rparsing log, completed traces ::  89%|########8 | 28010/31509 [00:46<00:04, 724.86it/s]","\rparsing log, completed traces ::  89%|########9 | 28083/31509 [00:46<00:04, 715.81it/s]","\rparsing log, completed traces ::  89%|########9 | 28155/31509 [00:46<00:04, 709.77it/s]","\rparsing log, completed traces ::  90%|########9 | 28229/31509 [00:46<00:04, 717.14it/s]","\rparsing log, completed traces ::  90%|########9 | 28301/31509 [00:47<00:04, 716.78it/s]","\rparsing log, completed traces ::  90%|######### | 28376/31509 [00:47<00:04, 724.06it/s]","\rparsing log, completed traces ::  90%|######### | 28449/31509 [00:47<00:04, 706.57it/s]","\rparsing log, completed traces ::  91%|######### | 28526/31509 [00:47<00:04, 724.38it/s]","\rparsing log, completed traces ::  91%|######### | 28603/31509 [00:47<00:03, 733.38it/s]","\rparsing log, completed traces ::  91%|#########1| 28677/31509 [00:47<00:03, 722.02it/s]","\rparsing log, completed traces ::  91%|#########1| 28750/31509 [00:47<00:04, 686.16it/s]","\rparsing log, completed traces ::  91%|#########1| 28820/31509 [00:47<00:03, 680.87it/s]","\rparsing log, completed traces ::  92%|#########1| 28889/31509 [00:47<00:03, 664.93it/s]","\rparsing log, completed traces ::  92%|#########1| 28963/31509 [00:47<00:03, 685.23it/s]","\rparsing log, completed traces ::  92%|#########2| 29037/31509 [00:48<00:03, 697.16it/s]","\rparsing log, completed traces ::  92%|#########2| 29107/31509 [00:48<00:03, 684.53it/s]","\rparsing log, completed traces ::  93%|#########2| 29185/31509 [00:48<00:03, 712.09it/s]","\rparsing log, completed traces ::  93%|#########2| 29257/31509 [00:48<00:03, 713.38it/s]","\rparsing log, completed traces ::  93%|#########3| 29329/31509 [00:48<00:03, 711.25it/s]","\rparsing log, completed traces ::  93%|#########3| 29401/31509 [00:48<00:03, 693.58it/s]","\rparsing log, completed traces ::  94%|#########3| 29471/31509 [00:48<00:02, 684.57it/s]","\rparsing log, completed traces ::  94%|#########3| 29540/31509 [00:48<00:02, 666.28it/s]","\rparsing log, completed traces ::  94%|#########3| 29613/31509 [00:48<00:02, 681.89it/s]","\rparsing log, completed traces ::  94%|#########4| 29687/31509 [00:49<00:02, 696.83it/s]","\rparsing log, completed traces ::  94%|#########4| 29760/31509 [00:49<00:02, 701.70it/s]","\rparsing log, completed traces ::  95%|#########4| 29831/31509 [00:49<00:02, 694.86it/s]","\rparsing log, completed traces ::  95%|#########4| 29903/31509 [00:49<00:02, 701.10it/s]","\rparsing log, completed traces ::  95%|#########5| 29974/31509 [00:49<00:02, 703.36it/s]","\rparsing log, completed traces ::  95%|#########5| 30045/31509 [00:49<00:02, 703.49it/s]","\rparsing log, completed traces ::  96%|#########5| 30120/31509 [00:49<00:01, 712.93it/s]","\rparsing log, completed traces ::  96%|#########5| 30193/31509 [00:49<00:01, 716.16it/s]","\rparsing log, completed traces ::  96%|#########6| 30267/31509 [00:49<00:01, 720.84it/s]","\rparsing log, completed traces ::  96%|#########6| 30342/31509 [00:49<00:01, 726.86it/s]","\rparsing log, completed traces ::  97%|#########6| 30420/31509 [00:50<00:01, 738.84it/s]","\rparsing log, completed traces ::  97%|#########6| 30494/31509 [00:50<00:01, 735.85it/s]","\rparsing log, completed traces ::  97%|#########7| 30570/31509 [00:50<00:01, 742.74it/s]","\rparsing log, completed traces ::  97%|#########7| 30645/31509 [00:50<00:01, 744.64it/s]","\rparsing log, completed traces ::  97%|#########7| 30720/31509 [00:50<00:01, 744.09it/s]","\rparsing log, completed traces ::  98%|#########7| 30795/31509 [00:50<00:00, 732.27it/s]","\rparsing log, completed traces ::  98%|#########7| 30869/31509 [00:50<00:00, 727.54it/s]","\rparsing log, completed traces ::  98%|#########8| 30942/31509 [00:51<00:03, 172.51it/s]","\rparsing log, completed traces ::  98%|#########8| 31017/31509 [00:51<00:02, 224.62it/s]","\rparsing log, completed traces ::  99%|#########8| 31092/31509 [00:52<00:01, 284.59it/s]","\rparsing log, completed traces ::  99%|#########8| 31167/31509 [00:52<00:00, 349.74it/s]","\rparsing log, completed traces ::  99%|#########9| 31242/31509 [00:52<00:00, 415.68it/s]","\rparsing log, completed traces ::  99%|#########9| 31312/31509 [00:52<00:00, 457.32it/s]","\rparsing log, completed traces :: 100%|#########9| 31381/31509 [00:52<00:00, 506.15it/s]","\rparsing log, completed traces :: 100%|#########9| 31454/31509 [00:52<00:00, 557.76it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:52<00:00, 598.61it/s]","\n","[data] Loaded BPI2017: BPI_Challenge_2017.xes, events=1202267","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 659/150370 [00:00<00:22, 6584.95it/s]","\rparsing log, completed traces ::   1%|          | 1410/150370 [00:00<00:21, 7089.88it/s]","\rparsing log, completed traces ::   1%|1         | 2163/150370 [00:00<00:20, 7260.02it/s]","\rparsing log, completed traces ::   2%|1         | 2901/150370 [00:00<00:20, 7307.10it/s]","\rparsing log, completed traces ::   2%|2         | 3632/150370 [00:00<00:20, 7255.12it/s]","\rparsing log, completed traces ::   3%|2         | 4377/150370 [00:00<00:19, 7319.26it/s]","\rparsing log, completed traces ::   3%|3         | 5109/150370 [00:01<00:40, 3619.58it/s]","\rparsing log, completed traces ::   4%|3         | 5836/150370 [00:01<00:33, 4297.52it/s]","\rparsing log, completed traces ::   4%|4         | 6562/150370 [00:01<00:29, 4921.21it/s]","\rparsing log, completed traces ::   5%|4         | 7292/150370 [00:01<00:26, 5462.90it/s]","\rparsing log, completed traces ::   5%|5         | 8068/150370 [00:01<00:23, 6032.40it/s]","\rparsing log, completed traces ::   6%|5         | 8846/150370 [00:01<00:21, 6487.95it/s]","\rparsing log, completed traces ::   6%|6         | 9615/150370 [00:01<00:20, 6811.89it/s]","\rparsing log, completed traces ::   7%|6         | 10380/150370 [00:01<00:19, 7034.61it/s]","\rparsing log, completed traces ::   7%|7         | 11136/150370 [00:01<00:19, 7182.69it/s]","\rparsing log, completed traces ::   8%|7         | 11884/150370 [00:01<00:19, 7247.94it/s]","\rparsing log, completed traces ::   8%|8         | 12631/150370 [00:02<00:18, 7310.85it/s]","\rparsing log, completed traces ::   9%|8         | 13397/150370 [00:02<00:18, 7412.15it/s]","\rparsing log, completed traces ::   9%|9         | 14149/150370 [00:02<00:18, 7390.30it/s]","\rparsing log, completed traces ::  10%|9         | 14900/150370 [00:02<00:18, 7424.58it/s]","\rparsing log, completed traces ::  10%|#         | 15685/150370 [00:02<00:17, 7549.44it/s]","\rparsing log, completed traces ::  11%|#         | 16487/150370 [00:02<00:17, 7688.70it/s]","\rparsing log, completed traces ::  11%|#1        | 17278/150370 [00:02<00:17, 7753.78it/s]","\rparsing log, completed traces ::  12%|#2        | 18056/150370 [00:03<00:35, 3716.41it/s]","\rparsing log, completed traces ::  13%|#2        | 18843/150370 [00:03<00:29, 4421.17it/s]","\rparsing log, completed traces ::  13%|#3        | 19610/150370 [00:03<00:25, 5054.89it/s]","\rparsing log, completed traces ::  14%|#3        | 20370/150370 [00:03<00:23, 5609.35it/s]","\rparsing log, completed traces ::  14%|#4        | 21179/150370 [00:03<00:20, 6198.35it/s]","\rparsing log, completed traces ::  15%|#4        | 21996/150370 [00:03<00:19, 6696.05it/s]","\rparsing log, completed traces ::  15%|#5        | 22827/150370 [00:03<00:17, 7119.61it/s]","\rparsing log, completed traces ::  16%|#5        | 23617/150370 [00:03<00:17, 7333.36it/s]","\rparsing log, completed traces ::  16%|#6        | 24402/150370 [00:03<00:17, 6998.53it/s]","\rparsing log, completed traces ::  17%|#6        | 25141/150370 [00:04<00:18, 6827.86it/s]","\rparsing log, completed traces ::  17%|#7        | 25851/150370 [00:04<00:18, 6666.05it/s]","\rparsing log, completed traces ::  18%|#7        | 26537/150370 [00:04<00:19, 6473.41it/s]","\rparsing log, completed traces ::  18%|#8        | 27198/150370 [00:04<00:19, 6376.06it/s]","\rparsing log, completed traces ::  19%|#8        | 27845/150370 [00:04<00:19, 6280.53it/s]","\rparsing log, completed traces ::  19%|#8        | 28536/150370 [00:04<00:18, 6446.04it/s]","\rparsing log, completed traces ::  19%|#9        | 29277/150370 [00:04<00:18, 6697.75it/s]","\rparsing log, completed traces ::  20%|#9        | 29981/150370 [00:04<00:17, 6794.78it/s]","\rparsing log, completed traces ::  20%|##        | 30665/150370 [00:05<00:39, 3018.22it/s]","\rparsing log, completed traces ::  21%|##        | 31293/150370 [00:05<00:33, 3526.99it/s]","\rparsing log, completed traces ::  21%|##1       | 31926/150370 [00:05<00:29, 4037.19it/s]","\rparsing log, completed traces ::  22%|##1       | 32565/150370 [00:05<00:26, 4520.74it/s]","\rparsing log, completed traces ::  22%|##2       | 33208/150370 [00:05<00:23, 4955.23it/s]","\rparsing log, completed traces ::  23%|##2       | 33863/150370 [00:05<00:21, 5344.71it/s]","\rparsing log, completed traces ::  23%|##2       | 34497/150370 [00:05<00:20, 5601.99it/s]","\rparsing log, completed traces ::  23%|##3       | 35123/150370 [00:06<00:19, 5769.91it/s]","\rparsing log, completed traces ::  24%|##3       | 35783/150370 [00:06<00:19, 5999.41it/s]","\rparsing log, completed traces ::  24%|##4       | 36503/150370 [00:06<00:17, 6340.44it/s]","\rparsing log, completed traces ::  25%|##4       | 37255/150370 [00:06<00:16, 6679.01it/s]","\rparsing log, completed traces ::  25%|##5       | 37996/150370 [00:06<00:16, 6887.32it/s]","\rparsing log, completed traces ::  26%|##5       | 38772/150370 [00:06<00:15, 7142.92it/s]","\rparsing log, completed traces ::  26%|##6       | 39552/150370 [00:06<00:15, 7336.90it/s]","\rparsing log, completed traces ::  27%|##6       | 40330/150370 [00:06<00:14, 7467.15it/s]","\rparsing log, completed traces ::  27%|##7       | 41116/150370 [00:06<00:14, 7568.89it/s]","\rparsing log, completed traces ::  28%|##7       | 41936/150370 [00:06<00:13, 7749.20it/s]","\rparsing log, completed traces ::  28%|##8       | 42743/150370 [00:07<00:13, 7843.09it/s]","\rparsing log, completed traces ::  29%|##8       | 43545/150370 [00:07<00:13, 7893.69it/s]","\rparsing log, completed traces ::  29%|##9       | 44336/150370 [00:07<00:13, 7897.58it/s]","\rparsing log, completed traces ::  30%|###       | 45127/150370 [00:07<00:30, 3399.68it/s]","\rparsing log, completed traces ::  31%|###       | 45905/150370 [00:07<00:25, 4080.15it/s]","\rparsing log, completed traces ::  31%|###1      | 46665/150370 [00:07<00:21, 4719.58it/s]","\rparsing log, completed traces ::  32%|###1      | 47414/150370 [00:08<00:19, 5290.06it/s]","\rparsing log, completed traces ::  32%|###2      | 48218/150370 [00:08<00:17, 5915.16it/s]","\rparsing log, completed traces ::  33%|###2      | 49125/150370 [00:08<00:15, 6687.84it/s]","\rparsing log, completed traces ::  33%|###3      | 49939/150370 [00:08<00:14, 7064.17it/s]","\rparsing log, completed traces ::  34%|###3      | 50733/150370 [00:08<00:13, 7253.70it/s]","\rparsing log, completed traces ::  34%|###4      | 51522/150370 [00:08<00:13, 7397.47it/s]","\rparsing log, completed traces ::  35%|###4      | 52307/150370 [00:08<00:13, 7485.39it/s]","\rparsing log, completed traces ::  35%|###5      | 53104/150370 [00:08<00:12, 7611.29it/s]","\rparsing log, completed traces ::  36%|###5      | 53889/150370 [00:08<00:12, 7676.81it/s]","\rparsing log, completed traces ::  36%|###6      | 54745/150370 [00:08<00:12, 7920.05it/s]","\rparsing log, completed traces ::  37%|###6      | 55551/150370 [00:09<00:11, 7941.88it/s]","\rparsing log, completed traces ::  38%|###7      | 56395/150370 [00:09<00:11, 8088.39it/s]","\rparsing log, completed traces ::  38%|###8      | 57233/150370 [00:09<00:11, 8168.60it/s]","\rparsing log, completed traces ::  39%|###8      | 58055/150370 [00:09<00:11, 8131.11it/s]","\rparsing log, completed traces ::  39%|###9      | 58872/150370 [00:09<00:11, 8069.40it/s]","\rparsing log, completed traces ::  40%|###9      | 59717/150370 [00:09<00:11, 8181.78it/s]","\rparsing log, completed traces ::  40%|####      | 60537/150370 [00:09<00:11, 8036.46it/s]","\rparsing log, completed traces ::  41%|####      | 61461/150370 [00:09<00:10, 8389.91it/s]","\rparsing log, completed traces ::  41%|####1     | 62372/150370 [00:09<00:10, 8602.88it/s]","\rparsing log, completed traces ::  42%|####2     | 63234/150370 [00:10<00:25, 3416.15it/s]","\rparsing log, completed traces ::  43%|####2     | 64065/150370 [00:10<00:20, 4121.45it/s]","\rparsing log, completed traces ::  43%|####3     | 64892/150370 [00:10<00:17, 4824.18it/s]","\rparsing log, completed traces ::  44%|####3     | 65761/150370 [00:10<00:15, 5578.57it/s]","\rparsing log, completed traces ::  44%|####4     | 66628/150370 [00:10<00:13, 6253.56it/s]","\rparsing log, completed traces ::  45%|####4     | 67552/150370 [00:10<00:11, 6963.39it/s]","\rparsing log, completed traces ::  46%|####5     | 68436/150370 [00:11<00:11, 7438.03it/s]","\rparsing log, completed traces ::  46%|####6     | 69312/150370 [00:11<00:10, 7788.84it/s]","\rparsing log, completed traces ::  47%|####6     | 70172/150370 [00:11<00:10, 7916.26it/s]","\rparsing log, completed traces ::  47%|####7     | 71021/150370 [00:11<00:09, 8069.49it/s]","\rparsing log, completed traces ::  48%|####7     | 71869/150370 [00:11<00:09, 8115.55it/s]","\rparsing log, completed traces ::  48%|####8     | 72710/150370 [00:11<00:09, 8175.88it/s]","\rparsing log, completed traces ::  49%|####8     | 73549/150370 [00:11<00:09, 8020.06it/s]","\rparsing log, completed traces ::  49%|####9     | 74412/150370 [00:11<00:09, 8195.23it/s]","\rparsing log, completed traces ::  50%|#####     | 75320/150370 [00:11<00:08, 8450.74it/s]","\rparsing log, completed traces ::  51%|#####     | 76205/150370 [00:11<00:08, 8536.45it/s]","\rparsing log, completed traces ::  51%|#####1    | 77065/150370 [00:12<00:08, 8541.42it/s]","\rparsing log, completed traces ::  52%|#####1    | 77924/150370 [00:12<00:08, 8448.46it/s]","\rparsing log, completed traces ::  52%|#####2    | 78772/150370 [00:12<00:08, 8370.90it/s]","\rparsing log, completed traces ::  53%|#####2    | 79612/150370 [00:12<00:08, 8295.11it/s]","\rparsing log, completed traces ::  54%|#####3    | 80453/150370 [00:12<00:08, 8323.83it/s]","\rparsing log, completed traces ::  54%|#####4    | 81287/150370 [00:12<00:08, 8274.05it/s]","\rparsing log, completed traces ::  55%|#####4    | 82155/150370 [00:12<00:08, 8392.05it/s]","\rparsing log, completed traces ::  55%|#####5    | 83048/150370 [00:12<00:07, 8551.49it/s]","\rparsing log, completed traces ::  56%|#####5    | 83904/150370 [00:12<00:07, 8515.18it/s]","\rparsing log, completed traces ::  56%|#####6    | 84757/150370 [00:13<00:20, 3144.80it/s]","\rparsing log, completed traces ::  57%|#####6    | 85569/150370 [00:13<00:16, 3819.18it/s]","\rparsing log, completed traces ::  57%|#####7    | 86405/150370 [00:13<00:14, 4555.56it/s]","\rparsing log, completed traces ::  58%|#####8    | 87246/150370 [00:13<00:11, 5280.45it/s]","\rparsing log, completed traces ::  59%|#####8    | 88081/150370 [00:13<00:10, 5929.80it/s]","\rparsing log, completed traces ::  59%|#####9    | 88939/150370 [00:14<00:09, 6544.89it/s]","\rparsing log, completed traces ::  60%|#####9    | 89794/150370 [00:14<00:08, 7033.87it/s]","\rparsing log, completed traces ::  60%|######    | 90635/150370 [00:14<00:08, 7393.34it/s]","\rparsing log, completed traces ::  61%|######    | 91485/150370 [00:14<00:07, 7683.26it/s]","\rparsing log, completed traces ::  61%|######1   | 92333/150370 [00:14<00:07, 7905.28it/s]","\rparsing log, completed traces ::  62%|######1   | 93170/150370 [00:14<00:07, 7977.51it/s]","\rparsing log, completed traces ::  63%|######2   | 94015/150370 [00:14<00:06, 8112.44it/s]","\rparsing log, completed traces ::  63%|######3   | 94902/150370 [00:14<00:06, 8331.23it/s]","\rparsing log, completed traces ::  64%|######3   | 95772/150370 [00:14<00:06, 8439.49it/s]","\rparsing log, completed traces ::  64%|######4   | 96629/150370 [00:14<00:06, 8395.08it/s]","\rparsing log, completed traces ::  65%|######4   | 97477/150370 [00:15<00:06, 8311.64it/s]","\rparsing log, completed traces ::  65%|######5   | 98315/150370 [00:15<00:06, 8324.92it/s]","\rparsing log, completed traces ::  66%|######5   | 99152/150370 [00:15<00:06, 8334.84it/s]","\rparsing log, completed traces ::  66%|######6   | 99989/150370 [00:15<00:06, 8323.99it/s]","\rparsing log, completed traces ::  67%|######7   | 100828/150370 [00:15<00:05, 8332.81it/s]","\rparsing log, completed traces ::  68%|######7   | 101688/150370 [00:15<00:05, 8392.42it/s]","\rparsing log, completed traces ::  68%|######8   | 102549/150370 [00:15<00:05, 8454.82it/s]","\rparsing log, completed traces ::  69%|######8   | 103396/150370 [00:15<00:05, 8413.54it/s]","\rparsing log, completed traces ::  69%|######9   | 104238/150370 [00:15<00:05, 8379.66it/s]","\rparsing log, completed traces ::  70%|######9   | 105077/150370 [00:16<00:05, 8310.95it/s]","\rparsing log, completed traces ::  70%|#######   | 105909/150370 [00:16<00:05, 8303.10it/s]","\rparsing log, completed traces ::  71%|#######   | 106740/150370 [00:16<00:05, 8275.90it/s]","\rparsing log, completed traces ::  72%|#######1  | 107568/150370 [00:16<00:05, 8270.29it/s]","\rparsing log, completed traces ::  72%|#######2  | 108396/150370 [00:16<00:05, 8180.42it/s]","\rparsing log, completed traces ::  73%|#######2  | 109215/150370 [00:16<00:05, 8171.86it/s]","\rparsing log, completed traces ::  73%|#######3  | 110033/150370 [00:17<00:14, 2773.47it/s]","\rparsing log, completed traces ::  74%|#######3  | 110847/150370 [00:17<00:11, 3448.31it/s]","\rparsing log, completed traces ::  74%|#######4  | 111671/150370 [00:17<00:09, 4178.38it/s]","\rparsing log, completed traces ::  75%|#######4  | 112478/150370 [00:17<00:07, 4874.03it/s]","\rparsing log, completed traces ::  75%|#######5  | 113265/150370 [00:17<00:06, 5482.87it/s]","\rparsing log, completed traces ::  76%|#######5  | 114251/150370 [00:17<00:05, 6453.05it/s]","\rparsing log, completed traces ::  77%|#######6  | 115258/150370 [00:17<00:04, 7329.05it/s]","\rparsing log, completed traces ::  77%|#######7  | 116253/150370 [00:17<00:04, 8003.56it/s]","\rparsing log, completed traces ::  78%|#######8  | 117390/150370 [00:18<00:03, 8908.24it/s]","\rparsing log, completed traces ::  79%|#######8  | 118370/150370 [00:18<00:03, 8515.45it/s]","\rparsing log, completed traces ::  79%|#######9  | 119287/150370 [00:18<00:03, 8267.23it/s]","\rparsing log, completed traces ::  80%|#######9  | 120160/150370 [00:18<00:03, 8118.14it/s]","\rparsing log, completed traces ::  80%|########  | 121004/150370 [00:18<00:03, 7983.36it/s]","\rparsing log, completed traces ::  81%|########1 | 121825/150370 [00:18<00:03, 7911.04it/s]","\rparsing log, completed traces ::  82%|########1 | 122632/150370 [00:18<00:03, 7848.00it/s]","\rparsing log, completed traces ::  82%|########2 | 123427/150370 [00:18<00:03, 7724.52it/s]","\rparsing log, completed traces ::  83%|########2 | 124207/150370 [00:18<00:03, 7658.62it/s]","\rparsing log, completed traces ::  83%|########3 | 124978/150370 [00:19<00:03, 7636.70it/s]","\rparsing log, completed traces ::  84%|########3 | 125763/150370 [00:19<00:03, 7696.64it/s]","\rparsing log, completed traces ::  84%|########4 | 126554/150370 [00:19<00:03, 7757.82it/s]","\rparsing log, completed traces ::  85%|########4 | 127362/150370 [00:19<00:02, 7852.53it/s]","\rparsing log, completed traces ::  85%|########5 | 128149/150370 [00:19<00:02, 7845.65it/s]","\rparsing log, completed traces ::  86%|########5 | 128961/150370 [00:19<00:02, 7902.05it/s]","\rparsing log, completed traces ::  86%|########6 | 129769/150370 [00:19<00:02, 7935.13it/s]","\rparsing log, completed traces ::  87%|########6 | 130564/150370 [00:19<00:02, 7926.67it/s]","\rparsing log, completed traces ::  87%|########7 | 131363/150370 [00:19<00:02, 7945.16it/s]","\rparsing log, completed traces ::  88%|########7 | 132296/150370 [00:19<00:02, 8358.28it/s]","\rparsing log, completed traces ::  89%|########8 | 133193/150370 [00:20<00:02, 8540.73it/s]","\rparsing log, completed traces ::  89%|########9 | 134048/150370 [00:20<00:01, 8451.63it/s]","\rparsing log, completed traces ::  90%|########9 | 134894/150370 [00:20<00:01, 8369.52it/s]","\rparsing log, completed traces ::  90%|######### | 135732/150370 [00:20<00:01, 8221.82it/s]","\rparsing log, completed traces ::  91%|######### | 136555/150370 [00:20<00:01, 8153.89it/s]","\rparsing log, completed traces ::  91%|#########1| 137371/150370 [00:20<00:01, 8019.64it/s]","\rparsing log, completed traces ::  92%|#########1| 138174/150370 [00:21<00:04, 2521.80it/s]","\rparsing log, completed traces ::  92%|#########2| 138989/150370 [00:21<00:03, 3173.93it/s]","\rparsing log, completed traces ::  93%|#########2| 139778/150370 [00:21<00:02, 3842.83it/s]","\rparsing log, completed traces ::  94%|#########3| 140634/150370 [00:21<00:02, 4633.08it/s]","\rparsing log, completed traces ::  94%|#########4| 141455/150370 [00:21<00:01, 5317.56it/s]","\rparsing log, completed traces ::  95%|#########4| 142292/150370 [00:21<00:01, 5970.84it/s]","\rparsing log, completed traces ::  95%|#########5| 143099/150370 [00:22<00:01, 6465.86it/s]","\rparsing log, completed traces ::  96%|#########5| 143934/150370 [00:22<00:00, 6926.98it/s]","\rparsing log, completed traces ::  96%|#########6| 144750/150370 [00:22<00:00, 7227.52it/s]","\rparsing log, completed traces ::  97%|#########6| 145554/150370 [00:22<00:00, 7106.84it/s]","\rparsing log, completed traces ::  97%|#########7| 146322/150370 [00:22<00:00, 6888.50it/s]","\rparsing log, completed traces ::  98%|#########7| 147052/150370 [00:22<00:00, 6783.14it/s]","\rparsing log, completed traces ::  98%|#########8| 147759/150370 [00:22<00:00, 6718.88it/s]","\rparsing log, completed traces ::  99%|#########8| 148451/150370 [00:22<00:00, 6693.12it/s]","\rparsing log, completed traces ::  99%|#########9| 149163/150370 [00:22<00:00, 6811.36it/s]","\rparsing log, completed traces :: 100%|#########9| 149929/150370 [00:23<00:00, 7050.36it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:23<00:00, 6519.28it/s]","\n","[data] Loaded ROAD: Road_Traffic_Fine_Management_Process.xes, events=561470","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=64, lr=0.0005] Epoch 1: validation_loss = 0.5664 acc=0.7585 f1=0.4002 top3=0.9793 ece=0.0400","\n","[BPI2012][bs=64, lr=0.0005] Epoch 2: validation_loss = 0.5367 acc=0.7741 f1=0.4369 top3=0.9811 ece=0.0245","\n","[BPI2012][bs=64, lr=0.0005] Epoch 3: validation_loss = 0.5302 acc=0.7779 f1=0.4844 top3=0.9803 ece=0.0249","\n","[BPI2012][bs=64, lr=0.0005] Epoch 4: validation_loss = 0.5296 acc=0.7802 f1=0.4766 top3=0.9797 ece=0.0207","\n","[BPI2012][bs=64, lr=0.0005] Epoch 5: validation_loss = 0.5226 acc=0.7824 f1=0.5039 top3=0.9804 ece=0.0114","\n","[BPI2012][bs=64, lr=0.0005] Epoch 6: validation_loss = 0.5225 acc=0.7688 f1=0.4848 top3=0.9803 ece=0.0212","\n","[BPI2012][bs=64, lr=0.0005] Epoch 7: validation_loss = 0.5222 acc=0.7838 f1=0.5036 top3=0.9804 ece=0.0111","\n","[BPI2012][bs=64, lr=0.0005] Epoch 8: validation_loss = 0.5242 acc=0.7623 f1=0.4640 top3=0.9801 ece=0.0184","\n","[BPI2012][bs=64, lr=0.0005] Epoch 9: validation_loss = 0.5183 acc=0.7842 f1=0.5014 top3=0.9816 ece=0.0178","\n","[BPI2012][bs=64, lr=0.0005] Epoch 10: validation_loss = 0.5152 acc=0.7839 f1=0.4944 top3=0.9806 ece=0.0163","\n","[BPI2012][bs=64, lr=0.0005] Epoch 11: validation_loss = 0.5202 acc=0.7774 f1=0.4875 top3=0.9804 ece=0.0183","\n","[BPI2012][bs=64, lr=0.0005] Epoch 12: validation_loss = 0.5165 acc=0.7837 f1=0.4968 top3=0.9804 ece=0.0213","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=64, lr=0.001] Epoch 1: validation_loss = 0.5503 acc=0.7587 f1=0.4562 top3=0.9791 ece=0.0428","\n","[BPI2012][bs=64, lr=0.001] Epoch 2: validation_loss = 0.5358 acc=0.7709 f1=0.4741 top3=0.9809 ece=0.0261","\n","[BPI2012][bs=64, lr=0.001] Epoch 3: validation_loss = 0.5259 acc=0.7821 f1=0.5082 top3=0.9811 ece=0.0179","\n","[BPI2012][bs=64, lr=0.001] Epoch 4: validation_loss = 0.5308 acc=0.7668 f1=0.4878 top3=0.9812 ece=0.0202","\n","[BPI2012][bs=64, lr=0.001] Epoch 5: validation_loss = 0.5252 acc=0.7747 f1=0.4944 top3=0.9815 ece=0.0148","\n","[BPI2012][bs=64, lr=0.001] Epoch 6: validation_loss = 0.5223 acc=0.7776 f1=0.5207 top3=0.9816 ece=0.0257","\n","[BPI2012][bs=64, lr=0.001] Epoch 7: validation_loss = 0.5187 acc=0.7830 f1=0.4795 top3=0.9803 ece=0.0183","\n","[BPI2012][bs=64, lr=0.001] Epoch 8: validation_loss = 0.5185 acc=0.7843 f1=0.5143 top3=0.9795 ece=0.0233","\n","[BPI2012][bs=64, lr=0.001] Epoch 9: validation_loss = 0.5204 acc=0.7778 f1=0.5143 top3=0.9803 ece=0.0215","\n","[BPI2012][bs=64, lr=0.001] Epoch 10: validation_loss = 0.5234 acc=0.7730 f1=0.5193 top3=0.9810 ece=0.0241","\n","[BPI2012][bs=64, lr=0.001] Epoch 11: validation_loss = 0.5208 acc=0.7804 f1=0.5160 top3=0.9817 ece=0.0318","\n","[BPI2012][bs=64, lr=0.001] Epoch 12: validation_loss = 0.5137 acc=0.7777 f1=0.4860 top3=0.9800 ece=0.0219","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=128, lr=0.0005] Epoch 1: validation_loss = 0.5834 acc=0.7650 f1=0.3951 top3=0.9759 ece=0.0264","\n","[BPI2012][bs=128, lr=0.0005] Epoch 2: validation_loss = 0.5466 acc=0.7723 f1=0.4202 top3=0.9794 ece=0.0270","\n","[BPI2012][bs=128, lr=0.0005] Epoch 3: validation_loss = 0.5379 acc=0.7767 f1=0.4396 top3=0.9809 ece=0.0364","\n","[BPI2012][bs=128, lr=0.0005] Epoch 4: validation_loss = 0.5312 acc=0.7784 f1=0.4590 top3=0.9795 ece=0.0279","\n","[BPI2012][bs=128, lr=0.0005] Epoch 5: validation_loss = 0.5254 acc=0.7774 f1=0.4751 top3=0.9798 ece=0.0198","\n","[BPI2012][bs=128, lr=0.0005] Epoch 6: validation_loss = 0.5255 acc=0.7783 f1=0.4758 top3=0.9799 ece=0.0141","\n","[BPI2012][bs=128, lr=0.0005] Epoch 7: validation_loss = 0.5224 acc=0.7776 f1=0.4975 top3=0.9803 ece=0.0130","\n","[BPI2012][bs=128, lr=0.0005] Epoch 8: validation_loss = 0.5215 acc=0.7798 f1=0.4997 top3=0.9805 ece=0.0154","\n","[BPI2012][bs=128, lr=0.0005] Epoch 9: validation_loss = 0.5194 acc=0.7791 f1=0.5027 top3=0.9806 ece=0.0166","\n","[BPI2012][bs=128, lr=0.0005] Epoch 10: validation_loss = 0.5209 acc=0.7828 f1=0.4932 top3=0.9803 ece=0.0161","\n","[BPI2012][bs=128, lr=0.0005] Epoch 11: validation_loss = 0.5232 acc=0.7780 f1=0.4894 top3=0.9809 ece=0.0250","\n","[BPI2012][bs=128, lr=0.0005] Epoch 12: validation_loss = 0.5183 acc=0.7776 f1=0.4771 top3=0.9814 ece=0.0277","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=128, lr=0.001] Epoch 1: validation_loss = 0.5520 acc=0.7724 f1=0.4225 top3=0.9780 ece=0.0180","\n","[BPI2012][bs=128, lr=0.001] Epoch 2: validation_loss = 0.5367 acc=0.7689 f1=0.4327 top3=0.9799 ece=0.0239","\n","[BPI2012][bs=128, lr=0.001] Epoch 3: validation_loss = 0.5301 acc=0.7662 f1=0.4729 top3=0.9803 ece=0.0254","\n","[BPI2012][bs=128, lr=0.001] Epoch 4: validation_loss = 0.5282 acc=0.7788 f1=0.4961 top3=0.9809 ece=0.0212","\n","[BPI2012][bs=128, lr=0.001] Epoch 5: validation_loss = 0.5253 acc=0.7813 f1=0.4910 top3=0.9810 ece=0.0218","\n","[BPI2012][bs=128, lr=0.001] Epoch 6: validation_loss = 0.5247 acc=0.7742 f1=0.4480 top3=0.9804 ece=0.0316","\n","[BPI2012][bs=128, lr=0.001] Epoch 7: validation_loss = 0.5215 acc=0.7771 f1=0.4767 top3=0.9803 ece=0.0256","\n","[BPI2012][bs=128, lr=0.001] Epoch 8: validation_loss = 0.5204 acc=0.7827 f1=0.4919 top3=0.9816 ece=0.0217","\n","[BPI2012][bs=128, lr=0.001] Epoch 9: validation_loss = 0.5169 acc=0.7772 f1=0.4995 top3=0.9803 ece=0.0143","\n","[BPI2012][bs=128, lr=0.001] Epoch 10: validation_loss = 0.5179 acc=0.7819 f1=0.4989 top3=0.9804 ece=0.0193","\n","[BPI2012][bs=128, lr=0.001] Epoch 11: validation_loss = 0.5153 acc=0.7692 f1=0.4805 top3=0.9803 ece=0.0163","\n","[BPI2012][bs=128, lr=0.001] Epoch 12: validation_loss = 0.5140 acc=0.7780 f1=0.4969 top3=0.9809 ece=0.0229","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=256, lr=0.0005] Epoch 1: validation_loss = 0.6620 acc=0.7636 f1=0.3431 top3=0.9703 ece=0.0827","\n","[BPI2012][bs=256, lr=0.0005] Epoch 2: validation_loss = 0.5762 acc=0.7709 f1=0.3942 top3=0.9767 ece=0.0319","\n","[BPI2012][bs=256, lr=0.0005] Epoch 3: validation_loss = 0.5552 acc=0.7718 f1=0.4056 top3=0.9785 ece=0.0318","\n","[BPI2012][bs=256, lr=0.0005] Epoch 4: validation_loss = 0.5422 acc=0.7623 f1=0.4165 top3=0.9797 ece=0.0229","\n","[BPI2012][bs=256, lr=0.0005] Epoch 5: validation_loss = 0.5386 acc=0.7747 f1=0.4342 top3=0.9797 ece=0.0231","\n","[BPI2012][bs=256, lr=0.0005] Epoch 6: validation_loss = 0.5320 acc=0.7816 f1=0.4460 top3=0.9804 ece=0.0204","\n","[BPI2012][bs=256, lr=0.0005] Epoch 7: validation_loss = 0.5305 acc=0.7777 f1=0.4427 top3=0.9805 ece=0.0136","\n","[BPI2012][bs=256, lr=0.0005] Epoch 8: validation_loss = 0.5280 acc=0.7763 f1=0.4653 top3=0.9805 ece=0.0141","\n","[BPI2012][bs=256, lr=0.0005] Epoch 9: validation_loss = 0.5263 acc=0.7769 f1=0.4656 top3=0.9795 ece=0.0211","\n","[BPI2012][bs=256, lr=0.0005] Epoch 10: validation_loss = 0.5287 acc=0.7838 f1=0.4962 top3=0.9803 ece=0.0234","\n","[BPI2012][bs=256, lr=0.0005] Epoch 11: validation_loss = 0.5225 acc=0.7828 f1=0.4956 top3=0.9800 ece=0.0159","\n","[BPI2012][bs=256, lr=0.0005] Epoch 12: validation_loss = 0.5225 acc=0.7826 f1=0.4923 top3=0.9803 ece=0.0216","\n","[BPI2012] samples train/val/test: 39001/8312/8991, vocab=23","\n","[BPI2012][bs=256, lr=0.001] Epoch 1: validation_loss = 0.5782 acc=0.7701 f1=0.3947 top3=0.9782 ece=0.0340","\n","[BPI2012][bs=256, lr=0.001] Epoch 2: validation_loss = 0.5414 acc=0.7754 f1=0.4287 top3=0.9797 ece=0.0268","\n","[BPI2012][bs=256, lr=0.001] Epoch 3: validation_loss = 0.5333 acc=0.7800 f1=0.4402 top3=0.9804 ece=0.0332","\n","[BPI2012][bs=256, lr=0.001] Epoch 4: validation_loss = 0.5291 acc=0.7832 f1=0.4785 top3=0.9805 ece=0.0185","\n","[BPI2012][bs=256, lr=0.001] Epoch 5: validation_loss = 0.5260 acc=0.7824 f1=0.4914 top3=0.9801 ece=0.0219","\n","[BPI2012][bs=256, lr=0.001] Epoch 6: validation_loss = 0.5254 acc=0.7801 f1=0.5001 top3=0.9809 ece=0.0255","\n","[BPI2012][bs=256, lr=0.001] Epoch 7: validation_loss = 0.5217 acc=0.7777 f1=0.4990 top3=0.9811 ece=0.0238","\n","[BPI2012][bs=256, lr=0.001] Epoch 8: validation_loss = 0.5221 acc=0.7790 f1=0.5032 top3=0.9794 ece=0.0155","\n","[BPI2012][bs=256, lr=0.001] Epoch 9: validation_loss = 0.5180 acc=0.7783 f1=0.5008 top3=0.9801 ece=0.0133","\n","[BPI2012][bs=256, lr=0.001] Epoch 10: validation_loss = 0.5189 acc=0.7694 f1=0.4956 top3=0.9809 ece=0.0193","\n","[BPI2012][bs=256, lr=0.001] Epoch 11: validation_loss = 0.5173 acc=0.7831 f1=0.4954 top3=0.9799 ece=0.0125","\n","[BPI2012][bs=256, lr=0.001] Epoch 12: validation_loss = 0.5164 acc=0.7779 f1=0.4885 top3=0.9812 ece=0.0231","\n","[BPI2012] Best setting: bs=64 lr=0.001 | val_top3=0.9817 | test_acc=0.7787 test_top3=0.9795 ece=0.0241","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=64, lr=0.0005] Epoch 1: validation_loss = 0.4055 acc=0.8335 f1=0.5762 top3=0.9866 ece=0.0210","\n","[BPI2017][bs=64, lr=0.0005] Epoch 2: validation_loss = 0.3971 acc=0.8338 f1=0.5642 top3=0.9870 ece=0.0262","\n","[BPI2017][bs=64, lr=0.0005] Epoch 3: validation_loss = 0.3908 acc=0.8308 f1=0.5762 top3=0.9863 ece=0.0174","\n","[BPI2017][bs=64, lr=0.0005] Epoch 4: validation_loss = 0.3905 acc=0.8387 f1=0.5921 top3=0.9867 ece=0.0121","\n","[BPI2017][bs=64, lr=0.0005] Epoch 5: validation_loss = 0.3870 acc=0.8330 f1=0.5910 top3=0.9862 ece=0.0109","\n","[BPI2017][bs=64, lr=0.0005] Epoch 6: validation_loss = 0.3843 acc=0.8357 f1=0.5948 top3=0.9856 ece=0.0097","\n","[BPI2017][bs=64, lr=0.0005] Epoch 7: validation_loss = 0.3860 acc=0.8355 f1=0.5826 top3=0.9879 ece=0.0173","\n","[BPI2017][bs=64, lr=0.0005] Epoch 8: validation_loss = 0.3845 acc=0.8305 f1=0.5890 top3=0.9883 ece=0.0114","\n","[BPI2017][bs=64, lr=0.0005] Epoch 9: validation_loss = 0.3838 acc=0.8334 f1=0.5962 top3=0.9868 ece=0.0098","\n","[BPI2017][bs=64, lr=0.0005] Epoch 10: validation_loss = 0.3859 acc=0.8349 f1=0.5985 top3=0.9873 ece=0.0230","\n","[BPI2017][bs=64, lr=0.0005] Epoch 11: validation_loss = 0.3816 acc=0.8355 f1=0.6002 top3=0.9862 ece=0.0080","\n","[BPI2017][bs=64, lr=0.0005] Epoch 12: validation_loss = 0.3862 acc=0.8305 f1=0.5973 top3=0.9885 ece=0.0231","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=64, lr=0.001] Epoch 1: validation_loss = 0.3987 acc=0.8326 f1=0.5849 top3=0.9875 ece=0.0224","\n","[BPI2017][bs=64, lr=0.001] Epoch 2: validation_loss = 0.3948 acc=0.8337 f1=0.5875 top3=0.9871 ece=0.0199","\n","[BPI2017][bs=64, lr=0.001] Epoch 3: validation_loss = 0.3984 acc=0.8345 f1=0.6002 top3=0.9863 ece=0.0208","\n","[BPI2017][bs=64, lr=0.001] Epoch 4: validation_loss = 0.3914 acc=0.8303 f1=0.5863 top3=0.9861 ece=0.0187","\n","[BPI2017][bs=64, lr=0.001] Epoch 5: validation_loss = 0.3920 acc=0.8297 f1=0.5831 top3=0.9856 ece=0.0168","\n","[BPI2017][bs=64, lr=0.001] Epoch 6: validation_loss = 0.3879 acc=0.8365 f1=0.5901 top3=0.9861 ece=0.0258","\n","[BPI2017][bs=64, lr=0.001] Epoch 7: validation_loss = 0.3873 acc=0.8359 f1=0.6041 top3=0.9873 ece=0.0211","\n","[BPI2017][bs=64, lr=0.001] Epoch 8: validation_loss = 0.3863 acc=0.8371 f1=0.5997 top3=0.9885 ece=0.0142","\n","[BPI2017][bs=64, lr=0.001] Epoch 9: validation_loss = 0.3862 acc=0.8361 f1=0.5991 top3=0.9877 ece=0.0169","\n","[BPI2017][bs=64, lr=0.001] Epoch 10: validation_loss = 0.3831 acc=0.8374 f1=0.6027 top3=0.9876 ece=0.0169","\n","[BPI2017][bs=64, lr=0.001] Epoch 11: validation_loss = 0.3811 acc=0.8362 f1=0.6036 top3=0.9876 ece=0.0082","\n","[BPI2017][bs=64, lr=0.001] Epoch 12: validation_loss = 0.3867 acc=0.8362 f1=0.5962 top3=0.9886 ece=0.0172","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=128, lr=0.0005] Epoch 1: validation_loss = 0.4223 acc=0.8318 f1=0.5627 top3=0.9850 ece=0.0275","\n","[BPI2017][bs=128, lr=0.0005] Epoch 2: validation_loss = 0.4044 acc=0.8241 f1=0.5583 top3=0.9856 ece=0.0265","\n","[BPI2017][bs=128, lr=0.0005] Epoch 3: validation_loss = 0.4018 acc=0.8279 f1=0.5844 top3=0.9847 ece=0.0138","\n","[BPI2017][bs=128, lr=0.0005] Epoch 4: validation_loss = 0.4079 acc=0.8228 f1=0.5688 top3=0.9861 ece=0.0282","\n","[BPI2017][bs=128, lr=0.0005] Epoch 5: validation_loss = 0.3905 acc=0.8344 f1=0.5913 top3=0.9867 ece=0.0144","\n","[BPI2017][bs=128, lr=0.0005] Epoch 6: validation_loss = 0.3885 acc=0.8297 f1=0.5773 top3=0.9868 ece=0.0188","\n","[BPI2017][bs=128, lr=0.0005] Epoch 7: validation_loss = 0.3844 acc=0.8362 f1=0.5890 top3=0.9864 ece=0.0076","\n","[BPI2017][bs=128, lr=0.0005] Epoch 8: validation_loss = 0.3866 acc=0.8348 f1=0.5879 top3=0.9860 ece=0.0149","\n","[BPI2017][bs=128, lr=0.0005] Epoch 9: validation_loss = 0.3829 acc=0.8377 f1=0.5975 top3=0.9879 ece=0.0115","\n","[BPI2017][bs=128, lr=0.0005] Epoch 10: validation_loss = 0.3841 acc=0.8314 f1=0.5885 top3=0.9880 ece=0.0120","\n","[BPI2017][bs=128, lr=0.0005] Epoch 11: validation_loss = 0.3867 acc=0.8322 f1=0.5942 top3=0.9880 ece=0.0178","\n","[BPI2017][bs=128, lr=0.0005] Epoch 12: validation_loss = 0.3834 acc=0.8361 f1=0.5943 top3=0.9885 ece=0.0116","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=128, lr=0.001] Epoch 1: validation_loss = 0.4098 acc=0.8235 f1=0.5576 top3=0.9847 ece=0.0303","\n","[BPI2017][bs=128, lr=0.001] Epoch 2: validation_loss = 0.4029 acc=0.8268 f1=0.5825 top3=0.9862 ece=0.0205","\n","[BPI2017][bs=128, lr=0.001] Epoch 3: validation_loss = 0.3898 acc=0.8340 f1=0.5780 top3=0.9876 ece=0.0193","\n","[BPI2017][bs=128, lr=0.001] Epoch 4: validation_loss = 0.3907 acc=0.8342 f1=0.5926 top3=0.9859 ece=0.0133","\n","[BPI2017][bs=128, lr=0.001] Epoch 5: validation_loss = 0.3872 acc=0.8384 f1=0.6012 top3=0.9857 ece=0.0180","\n","[BPI2017][bs=128, lr=0.001] Epoch 6: validation_loss = 0.3863 acc=0.8356 f1=0.5980 top3=0.9870 ece=0.0127","\n","[BPI2017][bs=128, lr=0.001] Epoch 7: validation_loss = 0.3838 acc=0.8367 f1=0.5922 top3=0.9876 ece=0.0170","\n","[BPI2017][bs=128, lr=0.001] Epoch 8: validation_loss = 0.3869 acc=0.8317 f1=0.5972 top3=0.9879 ece=0.0203","\n","[BPI2017][bs=128, lr=0.001] Epoch 9: validation_loss = 0.3807 acc=0.8375 f1=0.6030 top3=0.9885 ece=0.0071","\n","[BPI2017][bs=128, lr=0.001] Epoch 10: validation_loss = 0.3839 acc=0.8333 f1=0.5957 top3=0.9869 ece=0.0140","\n","[BPI2017][bs=128, lr=0.001] Epoch 11: validation_loss = 0.3875 acc=0.8213 f1=0.5852 top3=0.9884 ece=0.0239","\n","[BPI2017][bs=128, lr=0.001] Epoch 12: validation_loss = 0.3831 acc=0.8354 f1=0.6045 top3=0.9882 ece=0.0162","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=256, lr=0.0005] Epoch 1: validation_loss = 0.4634 acc=0.8280 f1=0.5604 top3=0.9842 ece=0.0484","\n","[BPI2017][bs=256, lr=0.0005] Epoch 2: validation_loss = 0.4170 acc=0.8297 f1=0.5618 top3=0.9860 ece=0.0294","\n","[BPI2017][bs=256, lr=0.0005] Epoch 3: validation_loss = 0.4056 acc=0.8291 f1=0.5614 top3=0.9853 ece=0.0245","\n","[BPI2017][bs=256, lr=0.0005] Epoch 4: validation_loss = 0.4013 acc=0.8264 f1=0.5576 top3=0.9858 ece=0.0226","\n","[BPI2017][bs=256, lr=0.0005] Epoch 5: validation_loss = 0.3950 acc=0.8304 f1=0.5771 top3=0.9853 ece=0.0175","\n","[BPI2017][bs=256, lr=0.0005] Epoch 6: validation_loss = 0.3927 acc=0.8347 f1=0.5847 top3=0.9865 ece=0.0253","\n","[BPI2017][bs=256, lr=0.0005] Epoch 7: validation_loss = 0.3901 acc=0.8331 f1=0.5863 top3=0.9871 ece=0.0090","\n","[BPI2017][bs=256, lr=0.0005] Epoch 8: validation_loss = 0.3879 acc=0.8315 f1=0.5854 top3=0.9876 ece=0.0137","\n","[BPI2017][bs=256, lr=0.0005] Epoch 9: validation_loss = 0.3887 acc=0.8277 f1=0.5741 top3=0.9867 ece=0.0187","\n","[BPI2017][bs=256, lr=0.0005] Epoch 10: validation_loss = 0.3861 acc=0.8343 f1=0.5962 top3=0.9876 ece=0.0135","\n","[BPI2017][bs=256, lr=0.0005] Epoch 11: validation_loss = 0.3852 acc=0.8355 f1=0.5864 top3=0.9877 ece=0.0122","\n","[BPI2017][bs=256, lr=0.0005] Epoch 12: validation_loss = 0.3850 acc=0.8339 f1=0.5915 top3=0.9868 ece=0.0084","\n","[BPI2017] samples train/val/test: 63477/13508/13494, vocab=24","\n","[BPI2017][bs=256, lr=0.001] Epoch 1: validation_loss = 0.4224 acc=0.8317 f1=0.5674 top3=0.9853 ece=0.0397","\n","[BPI2017][bs=256, lr=0.001] Epoch 2: validation_loss = 0.4015 acc=0.8331 f1=0.5687 top3=0.9862 ece=0.0201","\n","[BPI2017][bs=256, lr=0.001] Epoch 3: validation_loss = 0.3975 acc=0.8276 f1=0.5732 top3=0.9860 ece=0.0163","\n","[BPI2017][bs=256, lr=0.001] Epoch 4: validation_loss = 0.3926 acc=0.8360 f1=0.5987 top3=0.9872 ece=0.0178","\n","[BPI2017][bs=256, lr=0.001] Epoch 5: validation_loss = 0.3894 acc=0.8372 f1=0.5955 top3=0.9873 ece=0.0166","\n","[BPI2017][bs=256, lr=0.001] Epoch 6: validation_loss = 0.3901 acc=0.8357 f1=0.5976 top3=0.9860 ece=0.0160","\n","[BPI2017][bs=256, lr=0.001] Epoch 7: validation_loss = 0.3868 acc=0.8300 f1=0.5913 top3=0.9879 ece=0.0111","\n","[BPI2017][bs=256, lr=0.001] Epoch 8: validation_loss = 0.3901 acc=0.8283 f1=0.5798 top3=0.9872 ece=0.0162","\n","[BPI2017][bs=256, lr=0.001] Epoch 9: validation_loss = 0.3854 acc=0.8333 f1=0.5973 top3=0.9881 ece=0.0134","\n","[BPI2017][bs=256, lr=0.001] Epoch 10: validation_loss = 0.3839 acc=0.8389 f1=0.5991 top3=0.9882 ece=0.0189","\n","[BPI2017][bs=256, lr=0.001] Epoch 11: validation_loss = 0.3830 acc=0.8382 f1=0.6090 top3=0.9865 ece=0.0102","\n","[BPI2017][bs=256, lr=0.001] Epoch 12: validation_loss = 0.3874 acc=0.8315 f1=0.5914 top3=0.9884 ece=0.0168","\n","[BPI2017] Best setting: bs=64 lr=0.001 | val_top3=0.9886 | test_acc=0.8273 test_top3=0.9873 ece=0.0153","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=64, lr=0.0005] Epoch 1: validation_loss = 0.4037 acc=0.8630 f1=0.5990 top3=0.9975 ece=0.0150","\n","[ROAD][bs=64, lr=0.0005] Epoch 2: validation_loss = 0.3947 acc=0.8652 f1=0.7156 top3=0.9998 ece=0.0213","\n","[ROAD][bs=64, lr=0.0005] Epoch 3: validation_loss = 0.3879 acc=0.8647 f1=0.7148 top3=0.9995 ece=0.0244","\n","[ROAD][bs=64, lr=0.0005] Epoch 4: validation_loss = 0.3824 acc=0.8652 f1=0.7263 top3=0.9995 ece=0.0211","\n","[ROAD][bs=64, lr=0.0005] Epoch 5: validation_loss = 0.3928 acc=0.8652 f1=0.7156 top3=0.9993 ece=0.0472","\n","[ROAD][bs=64, lr=0.0005] Epoch 6: validation_loss = 0.3822 acc=0.8682 f1=0.7338 top3=0.9993 ece=0.0298","\n","[ROAD][bs=64, lr=0.0005] Epoch 7: validation_loss = 0.3916 acc=0.8650 f1=0.7147 top3=0.9993 ece=0.0439","\n","[ROAD][bs=64, lr=0.0005] Epoch 8: validation_loss = 0.3825 acc=0.8677 f1=0.7391 top3=0.9993 ece=0.0145","\n","[ROAD][bs=64, lr=0.0005] Epoch 9: validation_loss = 0.3801 acc=0.8689 f1=0.7373 top3=0.9993 ece=0.0227","\n","[ROAD][bs=64, lr=0.0005] Epoch 10: validation_loss = 0.3839 acc=0.8672 f1=0.7268 top3=0.9993 ece=0.0217","\n","[ROAD][bs=64, lr=0.0005] Epoch 11: validation_loss = 0.3788 acc=0.8667 f1=0.7317 top3=0.9993 ece=0.0174","\n","[ROAD][bs=64, lr=0.0005] Epoch 12: validation_loss = 0.3824 acc=0.8691 f1=0.7594 top3=0.9998 ece=0.0181","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=64, lr=0.001] Epoch 1: validation_loss = 0.3909 acc=0.8682 f1=0.7419 top3=0.9995 ece=0.0239","\n","[ROAD][bs=64, lr=0.001] Epoch 2: validation_loss = 0.3973 acc=0.8655 f1=0.7266 top3=0.9995 ece=0.0475","\n","[ROAD][bs=64, lr=0.001] Epoch 3: validation_loss = 0.3828 acc=0.8682 f1=0.7436 top3=0.9995 ece=0.0273","\n","[ROAD][bs=64, lr=0.001] Epoch 4: validation_loss = 0.3823 acc=0.8655 f1=0.7264 top3=0.9995 ece=0.0130","\n","[ROAD][bs=64, lr=0.001] Epoch 5: validation_loss = 0.3844 acc=0.8664 f1=0.7316 top3=0.9995 ece=0.0235","\n","[ROAD][bs=64, lr=0.001] Epoch 6: validation_loss = 0.3834 acc=0.8689 f1=0.7463 top3=0.9993 ece=0.0321","\n","[ROAD][bs=64, lr=0.001] Epoch 7: validation_loss = 0.3802 acc=0.8655 f1=0.7266 top3=0.9993 ece=0.0164","\n","[ROAD][bs=64, lr=0.001] Epoch 8: validation_loss = 0.3889 acc=0.8684 f1=0.7413 top3=0.9995 ece=0.0364","\n","[ROAD][bs=64, lr=0.001] Epoch 9: validation_loss = 0.3861 acc=0.8659 f1=0.7274 top3=0.9998 ece=0.0258","\n","[ROAD][bs=64, lr=0.001] Epoch 10: validation_loss = 0.3790 acc=0.8696 f1=0.7508 top3=0.9993 ece=0.0156","\n","[ROAD][bs=64, lr=0.001] Epoch 11: validation_loss = 0.3785 acc=0.8699 f1=0.7512 top3=0.9995 ece=0.0171","\n","[ROAD][bs=64, lr=0.001] Epoch 12: validation_loss = 0.3812 acc=0.8687 f1=0.7481 top3=0.9995 ece=0.0313","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=128, lr=0.0005] Epoch 1: validation_loss = 0.4353 acc=0.8613 f1=0.4473 top3=0.9901 ece=0.0196","\n","[ROAD][bs=128, lr=0.0005] Epoch 2: validation_loss = 0.3998 acc=0.8637 f1=0.6487 top3=0.9995 ece=0.0237","\n","[ROAD][bs=128, lr=0.0005] Epoch 3: validation_loss = 0.3881 acc=0.8647 f1=0.6957 top3=0.9995 ece=0.0167","\n","[ROAD][bs=128, lr=0.0005] Epoch 4: validation_loss = 0.3883 acc=0.8650 f1=0.7153 top3=0.9995 ece=0.0272","\n","[ROAD][bs=128, lr=0.0005] Epoch 5: validation_loss = 0.3838 acc=0.8652 f1=0.7156 top3=0.9995 ece=0.0108","\n","[ROAD][bs=128, lr=0.0005] Epoch 6: validation_loss = 0.3815 acc=0.8672 f1=0.7279 top3=0.9995 ece=0.0151","\n","[ROAD][bs=128, lr=0.0005] Epoch 7: validation_loss = 0.3821 acc=0.8684 f1=0.7370 top3=0.9993 ece=0.0245","\n","[ROAD][bs=128, lr=0.0005] Epoch 8: validation_loss = 0.3873 acc=0.8691 f1=0.7396 top3=0.9998 ece=0.0261","\n","[ROAD][bs=128, lr=0.0005] Epoch 9: validation_loss = 0.3854 acc=0.8677 f1=0.7295 top3=0.9993 ece=0.0292","\n","[ROAD][bs=128, lr=0.0005] Epoch 10: validation_loss = 0.3838 acc=0.8679 f1=0.7321 top3=0.9998 ece=0.0317","\n","[ROAD][bs=128, lr=0.0005] Epoch 11: validation_loss = 0.3849 acc=0.8652 f1=0.7156 top3=0.9995 ece=0.0311","\n","[ROAD][bs=128, lr=0.0005] Epoch 12: validation_loss = 0.3836 acc=0.8684 f1=0.7326 top3=0.9998 ece=0.0336","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=128, lr=0.001] Epoch 1: validation_loss = 0.4146 acc=0.8613 f1=0.5575 top3=0.9970 ece=0.0400","\n","[ROAD][bs=128, lr=0.001] Epoch 2: validation_loss = 0.3937 acc=0.8650 f1=0.7147 top3=0.9995 ece=0.0369","\n","[ROAD][bs=128, lr=0.001] Epoch 3: validation_loss = 0.3865 acc=0.8650 f1=0.7155 top3=0.9995 ece=0.0196","\n","[ROAD][bs=128, lr=0.001] Epoch 4: validation_loss = 0.3840 acc=0.8682 f1=0.7327 top3=0.9990 ece=0.0272","\n","[ROAD][bs=128, lr=0.001] Epoch 5: validation_loss = 0.3812 acc=0.8650 f1=0.7153 top3=0.9995 ece=0.0160","\n","[ROAD][bs=128, lr=0.001] Epoch 6: validation_loss = 0.3790 acc=0.8684 f1=0.7330 top3=0.9995 ece=0.0155","\n","[ROAD][bs=128, lr=0.001] Epoch 7: validation_loss = 0.3901 acc=0.8691 f1=0.7400 top3=0.9995 ece=0.0229","\n","[ROAD][bs=128, lr=0.001] Epoch 8: validation_loss = 0.3779 acc=0.8687 f1=0.7370 top3=0.9993 ece=0.0142","\n","[ROAD][bs=128, lr=0.001] Epoch 9: validation_loss = 0.3792 acc=0.8691 f1=0.7504 top3=0.9995 ece=0.0202","\n","[ROAD][bs=128, lr=0.001] Epoch 10: validation_loss = 0.3779 acc=0.8664 f1=0.7314 top3=0.9995 ece=0.0071","\n","[ROAD][bs=128, lr=0.001] Epoch 11: validation_loss = 0.3800 acc=0.8667 f1=0.7210 top3=0.9998 ece=0.0152","\n","[ROAD][bs=128, lr=0.001] Epoch 12: validation_loss = 0.3783 acc=0.8694 f1=0.7313 top3=0.9998 ece=0.0237","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=256, lr=0.0005] Epoch 1: validation_loss = 0.5017 acc=0.8502 f1=0.4337 top3=0.9830 ece=0.0387","\n","[ROAD][bs=256, lr=0.0005] Epoch 2: validation_loss = 0.4264 acc=0.8610 f1=0.4471 top3=0.9958 ece=0.0289","\n","[ROAD][bs=256, lr=0.0005] Epoch 3: validation_loss = 0.4113 acc=0.8618 f1=0.5649 top3=0.9970 ece=0.0367","\n","[ROAD][bs=256, lr=0.0005] Epoch 4: validation_loss = 0.3937 acc=0.8674 f1=0.6522 top3=0.9998 ece=0.0191","\n","[ROAD][bs=256, lr=0.0005] Epoch 5: validation_loss = 0.3915 acc=0.8682 f1=0.7334 top3=0.9998 ece=0.0299","\n","[ROAD][bs=256, lr=0.0005] Epoch 6: validation_loss = 0.3934 acc=0.8655 f1=0.7388 top3=0.9998 ece=0.0254","\n","[ROAD][bs=256, lr=0.0005] Epoch 7: validation_loss = 0.3863 acc=0.8647 f1=0.7151 top3=0.9995 ece=0.0202","\n","[ROAD][bs=256, lr=0.0005] Epoch 8: validation_loss = 0.3910 acc=0.8657 f1=0.7174 top3=0.9995 ece=0.0378","\n","[ROAD][bs=256, lr=0.0005] Epoch 9: validation_loss = 0.3854 acc=0.8652 f1=0.7156 top3=0.9995 ece=0.0280","\n","[ROAD][bs=256, lr=0.0005] Epoch 10: validation_loss = 0.3817 acc=0.8679 f1=0.7327 top3=0.9998 ece=0.0180","\n","[ROAD][bs=256, lr=0.0005] Epoch 11: validation_loss = 0.3838 acc=0.8647 f1=0.7148 top3=0.9995 ece=0.0230","\n","[ROAD][bs=256, lr=0.0005] Epoch 12: validation_loss = 0.3804 acc=0.8684 f1=0.7330 top3=0.9995 ece=0.0194","\n","[ROAD] samples train/val/test: 19366/4058/3973, vocab=11","\n","[ROAD][bs=256, lr=0.001] Epoch 1: validation_loss = 0.4411 acc=0.8610 f1=0.4471 top3=0.9906 ece=0.0374","\n","[ROAD][bs=256, lr=0.001] Epoch 2: validation_loss = 0.3966 acc=0.8682 f1=0.7307 top3=0.9995 ece=0.0189","\n","[ROAD][bs=256, lr=0.001] Epoch 3: validation_loss = 0.3882 acc=0.8655 f1=0.7372 top3=0.9993 ece=0.0227","\n","[ROAD][bs=256, lr=0.001] Epoch 4: validation_loss = 0.3841 acc=0.8684 f1=0.7422 top3=0.9993 ece=0.0221","\n","[ROAD][bs=256, lr=0.001] Epoch 5: validation_loss = 0.3854 acc=0.8650 f1=0.7153 top3=0.9993 ece=0.0146","\n","[ROAD][bs=256, lr=0.001] Epoch 6: validation_loss = 0.3872 acc=0.8652 f1=0.7156 top3=0.9993 ece=0.0285","\n","[ROAD][bs=256, lr=0.001] Epoch 7: validation_loss = 0.3822 acc=0.8689 f1=0.7465 top3=0.9993 ece=0.0291","\n","[ROAD][bs=256, lr=0.001] Epoch 8: validation_loss = 0.3863 acc=0.8652 f1=0.7261 top3=0.9993 ece=0.0291","\n","[ROAD][bs=256, lr=0.001] Epoch 9: validation_loss = 0.3830 acc=0.8664 f1=0.7299 top3=0.9993 ece=0.0288","\n","[ROAD][bs=256, lr=0.001] Epoch 10: validation_loss = 0.3798 acc=0.8694 f1=0.7493 top3=0.9995 ece=0.0152","\n","[ROAD][bs=256, lr=0.001] Epoch 11: validation_loss = 0.3787 acc=0.8684 f1=0.7439 top3=0.9993 ece=0.0252","\n","[ROAD][bs=256, lr=0.001] Epoch 12: validation_loss = 0.3791 acc=0.8687 f1=0.7425 top3=0.9993 ece=0.0245","\n","[ROAD] Best setting: bs=64 lr=0.0005 | val_top3=0.9998 | test_acc=0.8714 test_top3=1.0000 ece=0.0181","\n","Execution time: 22 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the saved results from the working directory, parse the nested structure, and print concise best/final metrics per dataset. If a \u201cbest\u201d configuration exists, I will use it for test metrics (and validation top-3); otherwise, I will fall back to the last recorded \u201cfinal\u201d metrics. For training and validation, I will print the latest final metrics available. The script executes immediately without any main guard and does not create any plots.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.exists(path):\n        print(f\"experiment_data.npy not found at: {path}\")\n        return None\n    try:\n        data = np.load(path, allow_pickle=True).item()\n    except Exception as e:\n        print(f\"Failed to load experiment data: {e}\")\n        return None\n    return data\n\n\ndef extract_final_from_list(lst):\n    # lst is expected to be a list like: [(\"final\", {metrics...}), ...]\n    if not isinstance(lst, (list, tuple)) or len(lst) == 0:\n        return None\n    last = lst[-1]\n    if isinstance(last, (list, tuple)) and len(last) == 2 and isinstance(last[1], dict):\n        return last[1]\n    # Fallback: try to find any dict in reversed order\n    for item in reversed(lst):\n        if (\n            isinstance(item, (list, tuple))\n            and len(item) == 2\n            and isinstance(item[1], dict)\n        ):\n            return item[1]\n        if isinstance(item, dict):\n            return item\n    return None\n\n\ndef print_split_metrics(split_name, metrics_dict):\n    # metrics_dict expected keys: loss, acc, macro_f1, top3, ece\n    if not isinstance(metrics_dict, dict):\n        return\n    name_map = {\n        \"train\": \"training\",\n        \"val\": \"validation\",\n        \"test\": \"test\",\n    }\n    prefix = name_map.get(split_name, split_name)\n    if \"loss\" in metrics_dict:\n        print(f\"{prefix} loss: {metrics_dict['loss']}\")\n    if \"acc\" in metrics_dict:\n        print(f\"{prefix} accuracy: {metrics_dict['acc']}\")\n    if \"macro_f1\" in metrics_dict:\n        print(f\"{prefix} macro F1 score: {metrics_dict['macro_f1']}\")\n    if \"top3\" in metrics_dict:\n        print(f\"{prefix} top-3 accuracy: {metrics_dict['top3']}\")\n    if \"ece\" in metrics_dict:\n        print(f\"{prefix} ECE: {metrics_dict['ece']}\")\n\n\ndef print_best_test_and_val(best_dict):\n    # best contains: batch_size, lr, val_top3, test_acc, test_top3, test_macro_f1, test_ece\n    if not isinstance(best_dict, dict) or len(best_dict) == 0:\n        return False\n    # Validation best\n    if \"val_top3\" in best_dict:\n        print(f\"best validation top-3 accuracy: {best_dict['val_top3']}\")\n    # Test best\n    if \"test_acc\" in best_dict:\n        print(f\"best test accuracy: {best_dict['test_acc']}\")\n    if \"test_top3\" in best_dict:\n        print(f\"best test top-3 accuracy: {best_dict['test_top3']}\")\n    if \"test_macro_f1\" in best_dict:\n        print(f\"best test macro F1 score: {best_dict['test_macro_f1']}\")\n    if \"test_ece\" in best_dict:\n        print(f\"best test ECE: {best_dict['test_ece']}\")\n    return True\n\n\ndef run():\n    experiment_data = load_experiment_data()\n    if (\n        experiment_data is None\n        or not isinstance(experiment_data, dict)\n        or len(experiment_data) == 0\n    ):\n        # Nothing to print\n        return\n\n    for ds_name, ds_obj in experiment_data.items():\n        print(ds_name)\n        if not isinstance(ds_obj, dict):\n            continue\n\n        # Prefer best metrics for validation top-3 and test metrics if available\n        best_printed = False\n        if (\n            \"best\" in ds_obj\n            and isinstance(ds_obj[\"best\"], dict)\n            and len(ds_obj[\"best\"]) > 0\n        ):\n            best_printed = print_best_test_and_val(ds_obj[\"best\"])\n\n        # Final training and validation metrics (last recorded)\n        metrics_container = ds_obj.get(\"metrics\", {})\n        if isinstance(metrics_container, dict):\n            # Training final\n            tr_final = extract_final_from_list(metrics_container.get(\"train\", []))\n            if tr_final:\n                print_split_metrics(\"train\", tr_final)\n            # Validation final (print in addition to best val top-3 to show loss/acc/F1/ECE)\n            va_final = extract_final_from_list(metrics_container.get(\"val\", []))\n            if va_final:\n                print_split_metrics(\"val\", va_final)\n            # If no best, print final test metrics\n            if not best_printed:\n                te_final = extract_final_from_list(metrics_container.get(\"test\", []))\n                if te_final:\n                    print_split_metrics(\"test\", te_final)\n\n\nrun()\n","parse_term_out":["BPI2012","\n","best validation top-3 accuracy: 0.9817131857555341","\n","best test accuracy: 0.7786675564453343","\n","best test top-3 accuracy: 0.9795350906462018","\n","best test macro F1 score: 0.5203529832123652","\n","best test ECE: 0.024086250490904147","\n","training loss: 0.5182093765343713","\n","training accuracy: 0.775826260865106","\n","training macro F1 score: 0.5355790796105326","\n","training top-3 accuracy: 0.9834876028819773","\n","training ECE: 0.026932697338659467","\n","validation loss: 0.5163689511572661","\n","validation accuracy: 0.7779114533205005","\n","validation macro F1 score: 0.4884874830109363","\n","validation top-3 accuracy: 0.9812319538017324","\n","validation ECE: 0.023136049978743384","\n","BPI2017","\n","best validation top-3 accuracy: 0.988599348534202","\n","best test accuracy: 0.8273306654809545","\n","best test top-3 accuracy: 0.9872535941900104","\n","best test macro F1 score: 0.6009938729444291","\n","best test ECE: 0.015301321384835033","\n","training loss: 0.39770616359021244","\n","training accuracy: 0.8273547899239094","\n","training macro F1 score: 0.6036030972793732","\n","training top-3 accuracy: 0.9879326370181325","\n","training ECE: 0.010086089828047916","\n","validation loss: 0.3874257102516017","\n","validation accuracy: 0.8315072549600236","\n","validation macro F1 score: 0.5914435900146698","\n","validation top-3 accuracy: 0.9883772579212319","\n","validation ECE: 0.01676174988134535","\n","ROAD","\n","best validation top-3 accuracy: 0.9997535731887629","\n","best test accuracy: 0.871381827334508","\n","best test top-3 accuracy: 1.0","\n","best test macro F1 score: 0.7490852700507147","\n","best test ECE: 0.018063319267987786","\n","training loss: 0.3843761781153816","\n","training accuracy: 0.8788598574821853","\n","training macro F1 score: 0.6474398709898581","\n","training top-3 accuracy: 0.9988639884333368","\n","training ECE: 0.016807799233787505","\n","validation loss: 0.39664561897442807","\n","validation accuracy: 0.8681616559881715","\n","validation macro F1 score: 0.7307272874133772","\n","validation top-3 accuracy: 0.9995071463775259","\n","validation ECE: 0.018899630771710283","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1328.1466343402863,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"","exp_results_dir":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838","metric":{"value":{"metric_names":[{"metric_name":"training loss","lower_is_better":true,"description":"Cross-entropy loss measured on the training split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.5182093765343713,"best_value":0.5182093765343713},{"dataset_name":"BPI2017","final_value":0.39770616359021244,"best_value":0.39770616359021244},{"dataset_name":"ROAD","final_value":0.3843761781153816,"best_value":0.3843761781153816}]},{"metric_name":"training accuracy","lower_is_better":false,"description":"Classification accuracy on the training split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.775826260865106,"best_value":0.775826260865106},{"dataset_name":"BPI2017","final_value":0.8273547899239094,"best_value":0.8273547899239094},{"dataset_name":"ROAD","final_value":0.8788598574821853,"best_value":0.8788598574821853}]},{"metric_name":"training macro F1 score","lower_is_better":false,"description":"Macro-averaged F1 score on the training split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.5355790796105326,"best_value":0.5355790796105326},{"dataset_name":"BPI2017","final_value":0.6036030972793732,"best_value":0.6036030972793732},{"dataset_name":"ROAD","final_value":0.6474398709898581,"best_value":0.6474398709898581}]},{"metric_name":"training top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the training split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.9834876028819773,"best_value":0.9834876028819773},{"dataset_name":"BPI2017","final_value":0.9879326370181325,"best_value":0.9879326370181325},{"dataset_name":"ROAD","final_value":0.9988639884333368,"best_value":0.9988639884333368}]},{"metric_name":"training ECE","lower_is_better":true,"description":"Expected Calibration Error on the training split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.026932697338659467,"best_value":0.026932697338659467},{"dataset_name":"BPI2017","final_value":0.010086089828047916,"best_value":0.010086089828047916},{"dataset_name":"ROAD","final_value":0.016807799233787505,"best_value":0.016807799233787505}]},{"metric_name":"validation loss","lower_is_better":true,"description":"Cross-entropy loss measured on the validation split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.5163689511572661,"best_value":0.5163689511572661},{"dataset_name":"BPI2017","final_value":0.3874257102516017,"best_value":0.3874257102516017},{"dataset_name":"ROAD","final_value":0.39664561897442807,"best_value":0.39664561897442807}]},{"metric_name":"validation accuracy","lower_is_better":false,"description":"Classification accuracy on the validation split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.7779114533205005,"best_value":0.7779114533205005},{"dataset_name":"BPI2017","final_value":0.8315072549600236,"best_value":0.8315072549600236},{"dataset_name":"ROAD","final_value":0.8681616559881715,"best_value":0.8681616559881715}]},{"metric_name":"validation macro F1 score","lower_is_better":false,"description":"Macro-averaged F1 score on the validation split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.4884874830109363,"best_value":0.4884874830109363},{"dataset_name":"BPI2017","final_value":0.5914435900146698,"best_value":0.5914435900146698},{"dataset_name":"ROAD","final_value":0.7307272874133772,"best_value":0.7307272874133772}]},{"metric_name":"validation top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the validation split; both final value and recorded best value are provided.","data":[{"dataset_name":"BPI2012","final_value":0.9812319538017324,"best_value":0.9817131857555341},{"dataset_name":"BPI2017","final_value":0.9883772579212319,"best_value":0.988599348534202},{"dataset_name":"ROAD","final_value":0.9995071463775259,"best_value":0.9997535731887629}]},{"metric_name":"validation ECE","lower_is_better":true,"description":"Expected Calibration Error on the validation split at the end of training.","data":[{"dataset_name":"BPI2012","final_value":0.023136049978743384,"best_value":0.023136049978743384},{"dataset_name":"BPI2017","final_value":0.01676174988134535,"best_value":0.01676174988134535},{"dataset_name":"ROAD","final_value":0.018899630771710283,"best_value":0.018899630771710283}]},{"metric_name":"test accuracy","lower_is_better":false,"description":"Best recorded classification accuracy on the test split.","data":[{"dataset_name":"BPI2012","final_value":0.7786675564453343,"best_value":0.7786675564453343},{"dataset_name":"BPI2017","final_value":0.8273306654809545,"best_value":0.8273306654809545},{"dataset_name":"ROAD","final_value":0.871381827334508,"best_value":0.871381827334508}]},{"metric_name":"test top-3 accuracy","lower_is_better":false,"description":"Best recorded top-3 accuracy on the test split.","data":[{"dataset_name":"BPI2012","final_value":0.9795350906462018,"best_value":0.9795350906462018},{"dataset_name":"BPI2017","final_value":0.9872535941900104,"best_value":0.9872535941900104},{"dataset_name":"ROAD","final_value":1.0,"best_value":1.0}]},{"metric_name":"test macro F1 score","lower_is_better":false,"description":"Best recorded macro-averaged F1 score on the test split.","data":[{"dataset_name":"BPI2012","final_value":0.5203529832123652,"best_value":0.5203529832123652},{"dataset_name":"BPI2017","final_value":0.6009938729444291,"best_value":0.6009938729444291},{"dataset_name":"ROAD","final_value":0.7490852700507147,"best_value":0.7490852700507147}]},{"metric_name":"test ECE","lower_is_better":true,"description":"Best recorded Expected Calibration Error on the test split.","data":[{"dataset_name":"BPI2012","final_value":0.024086250490904147,"best_value":0.024086250490904147},{"dataset_name":"BPI2017","final_value":0.015301321384835033,"best_value":0.015301321384835033},{"dataset_name":"ROAD","final_value":0.018063319267987786,"best_value":0.018063319267987786}]}]},"maximize":null,"name":null,"description":null},"is_buggy":false,"is_buggy_plots":false,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":["../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_loss_curves_next_activity.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_loss_curves_next_activity.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_reliability_test.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_reliability_test.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_confusion_matrix_next_activity_test.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_loss_curves_next_activity.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_confusion_matrix_next_activity_test.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_confusion_matrix_next_activity_test.png","../../logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_reliability_test.png"],"plot_paths":["experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_loss_curves_next_activity.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_loss_curves_next_activity.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_reliability_test.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_reliability_test.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_confusion_matrix_next_activity_test.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_loss_curves_next_activity.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_confusion_matrix_next_activity_test.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_confusion_matrix_next_activity_test.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_reliability_test.png"],"plot_analyses":[{"analysis":"The BPI2017 loss curves for next-activity prediction show a rapid decrease in both training and validation losses within the first few epochs, indicating that the model quickly learns the underlying patterns. However, the convergence towards the end suggests limited overfitting, as the validation loss stabilizes, closely following the training loss. The model appears to have generalized well on this dataset.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_loss_curves_next_activity.png"},{"analysis":"The BPI2012 loss curves similarly depict a quick reduction in loss values for both training and validation sets. The final epochs show stable loss values, suggesting that the model has effectively learned patterns without significant overfitting on this dataset. Both loss curves indicate successful tuning of the model's hyperparameters.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_loss_curves_next_activity.png"},{"analysis":"The BPI2017 reliability plot shows the model's accuracy closely aligning with the confidence levels, especially at higher confidences. This indicates that the model's predictions are reliable and well-calibrated, with accuracy increasing as confidence grows. It's a positive sign of model performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_reliability_test.png"},{"analysis":"The ROAD reliability plot demonstrates a good calibration between confidence and accuracy, although there is a slight deviation from the ideal line at lower confidence levels. This suggests that while the model performs well overall, there may be room for improvement in predictions at lower confidence levels.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_reliability_test.png"},{"analysis":"In the ROAD confusion matrix, there's a concentration of predictions along the diagonal, indicating good accuracy in predicting the correct next-activity. However, there are some off-diagonal predictions, suggesting areas where misclassification occurs, which could be further analyzed to improve model accuracy.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_confusion_matrix_next_activity_test.png"},{"analysis":"The ROAD loss curves show a consistent decrease in loss values, similar to the previous datasets, with stabilization towards the end. The close alignment of training and validation loss curves suggests effective learning and minimal overfitting.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/ROAD_loss_curves_next_activity.png"},{"analysis":"The BPI2017 confusion matrix shows a strong diagonal line, indicating the model's effectiveness in predicting the correct next-activity. There are few off-diagonal errors, suggesting high accuracy and good model performance for this dataset.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2017_confusion_matrix_next_activity_test.png"},{"analysis":"The BPI2012 confusion matrix also shows a concentration along the diagonal, with some off-diagonal misclassifications. These errors indicate areas for potential improvement, but overall, the model demonstrates good predictive accuracy for this dataset.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_confusion_matrix_next_activity_test.png"},{"analysis":"The BPI2012 reliability plot shows a close alignment between accuracy and confidence, with the model's accuracy increasing alongside confidence levels. This indicates reliable and well-calibrated predictions, similar to the BPI2017 reliability plot.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_b6970d0586c74652a8d858ed9350bd81_proc_361838/BPI2012_reliability_test.png"}],"vlm_feedback_summary":"The plots received from the experiments provide meaningful insights into the model's performance across different datasets and metrics. The loss curves consistently show effective learning with minimal overfitting, suggesting well-tuned hyperparameters. Reliability plots indicate well-calibrated predictions, particularly at higher confidence levels, but highlight areas for improvement at lower confidences. Confusion matrices demonstrate generally high accuracy in next-activity predictions, with some misclassifications pointing to opportunities for further refinement. Overall, the experiments appear to be progressing positively towards the research goals.","datasets_successfully_tested":["BPI2017","BPI2012","ROAD"],"ablation_name":null,"hyperparam_name":null,"is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport warnings\n\n# Use pm4py to load local XES files\nwarnings.filterwarnings(\"ignore\")\ntry:\n    import pm4py\n    from pm4py.objects.log.importer.xes import importer as xes_importer\nexcept Exception as e:\n    pm4py = None\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure following the naming convention\nexperiment_data = {\n    \"max_prefix_len\": {\n        # dataset_name: filled at runtime\n    }\n}\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Utilities to find and load XES\ndef find_xes_files():\n    candidates = []\n    search_dirs = [os.getcwd(), os.path.join(os.getcwd(), \"data\")]\n    for sd in search_dirs:\n        if os.path.isdir(sd):\n            for fn in os.listdir(sd):\n                if fn.lower().endswith(\".xes\") or fn.lower().endswith(\".xes.gz\"):\n                    candidates.append(os.path.join(sd, fn))\n    return list(sorted(set(candidates)))\n\n\ndef load_xes_to_df(filepath):\n    log = xes_importer.apply(filepath)\n    # pm4py conversion to dataframe\n    try:\n        df = pm4py.convert_to_dataframe(log)\n    except Exception:\n        from pm4py.objects.conversion.log import converter as log_converter\n\n        df = log_converter.apply(log, variant=log_converter.Variants.TO_DATA_FRAME)\n    # Standardize columns\n    col_map = {}\n    if \"case:concept:name\" in df.columns:\n        col_map[\"case:concept:name\"] = \"case_id\"\n    if \"concept:name\" in df.columns:\n        col_map[\"concept:name\"] = \"activity\"\n    if \"time:timestamp\" in df.columns:\n        col_map[\"time:timestamp\"] = \"timestamp\"\n    if \"lifecycle:transition\" in df.columns:\n        col_map[\"lifecycle:transition\"] = \"lifecycle\"\n    df = df.rename(columns=col_map)\n    needed = [\"case_id\", \"activity\", \"timestamp\"]\n    for c in needed:\n        if c not in df.columns:\n            raise ValueError(f\"Missing required column {c} in {filepath}\")\n    # Ensure timestamp is UTC-aware\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True)\n    # Ensure case_id and activity are strings\n    df[\"case_id\"] = df[\"case_id\"].astype(str)\n    df[\"activity\"] = df[\"activity\"].astype(str)\n    # Keep subset columns for consistency\n    keep_cols = [\"case_id\", \"activity\", \"timestamp\"]\n    if \"lifecycle\" in df.columns:\n        keep_cols.append(\"lifecycle\")\n    df = df[keep_cols].copy()\n    return df\n\n\ndef load_datasets_from_xes():\n    datasets = {}\n    files = find_xes_files()\n    if len(files) == 0 or pm4py is None:\n        # Fallback to synthetic small dataset to keep script executable\n        print(\n            \"[warn] No XES files found or pm4py not available. Generating synthetic dataset.\"\n        )\n        # Create a tiny synthetic event log\n        rows = []\n        rng = np.random.RandomState(42)\n        activities = [\"A\", \"B\", \"C\", \"D\", \"E\"]\n        for cid in range(1, 301):\n            t0 = pd.Timestamp(\"2020-01-01\", tz=\"UTC\") + pd.Timedelta(days=int(cid % 30))\n            T = rng.randint(3, 10)\n            ts = t0\n            for i in range(T):\n                act = activities[rng.randint(0, len(activities))]\n                rows.append(\n                    {\n                        \"case_id\": f\"C{cid}\",\n                        \"activity\": act,\n                        \"timestamp\": ts,\n                        \"lifecycle\": \"complete\",\n                    }\n                )\n                ts = ts + pd.Timedelta(hours=int(rng.randint(1, 48)))\n        df = pd.DataFrame(rows)\n        datasets[\"SYNTH\"] = df\n        return datasets\n    for fp in files:\n        try:\n            df = load_xes_to_df(fp)\n            name = os.path.splitext(os.path.basename(fp))[0]\n            datasets[name] = df\n        except Exception as e:\n            print(f\"[warn] Failed to load {fp}: {e}\")\n    if len(datasets) == 0:\n        print(\"[warn] No datasets successfully loaded; creating synthetic fallback.\")\n        return load_datasets_from_xes()\n    return datasets\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            # top-3 correctness\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef prepare_splits(df, max_prefix_len):\n    # cap to 5000 earliest cases for speed\n    try:\n        starts = (\n            df.sort_values(\"timestamp\")\n            .groupby(\"case_id\")[\"timestamp\"]\n            .min()\n            .reset_index()\n        )\n        if len(starts) > 5000:\n            keep_cases = set(starts.iloc[:5000][\"case_id\"])\n            df = df[df[\"case_id\"].isin(keep_cases)].copy()\n    except Exception:\n        pass\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Renormalize using train stats\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    return samples_train, samples_val, samples_test, act2id, pad_id\n\n\ndef train_eval_run(\n    df,\n    dataset_name,\n    max_prefix_len,\n    max_epochs=10,\n    batch_size=128,\n    lr=1e-3,\n    verbose=False,\n):\n    samples_train, samples_val, samples_test, act2id, pad_id = prepare_splits(\n        df, max_prefix_len\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        return None\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_top3\": [],\n    }\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_acc\"].append(val_acc)\n        hist[\"val_f1\"].append(val_f1)\n        hist[\"val_top3\"].append(val_top3)\n        if verbose:\n            print(\n                f\"[{dataset_name}] prefix={max_prefix_len} epoch {epoch}: val_loss={val_loss:.4f} acc={val_acc:.4f} f1={val_f1:.4f} top3={val_top3:.4f}\"\n            )\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n\n    result = {\n        \"hist\": hist,\n        \"final\": {\n            \"train\": {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n            \"val\": {\n                \"loss\": val_loss,\n                \"acc\": val_acc,\n                \"macro_f1\": val_f1,\n                \"top3\": val_top3,\n            },\n            \"test\": {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        },\n        \"y_true_test\": y_true_t.tolist(),\n        \"y_pred_test\": y_pred_t.tolist(),\n        \"test_probs\": probs_t.astype(np.float32),\n        \"vocab_size\": len(act2id),\n        \"pad_id\": pad_id,\n    }\n    return result\n\n\ndef main():\n    datasets = load_datasets_from_xes()\n    # Hyperparameter candidates\n    prefix_candidates = [5, 10, 15, 20, 30]\n    for dname, df in datasets.items():\n        print(f\"\\n=== Dataset: {dname} ===\")\n        experiment_data[\"max_prefix_len\"].setdefault(\n            dname,\n            {\n                \"metrics\": {\"train\": [], \"val\": []},\n                \"losses\": {\"train\": [], \"val\": []},\n                \"predictions\": [],\n                \"ground_truth\": [],\n                \"runs\": [],\n                \"epochs_check\": {},\n            },\n        )\n\n        # Epochs check at prefix=10\n        print(\"Epochs improvement check at max_prefix_len=10...\")\n        res_10e = train_eval_run(\n            df,\n            dname,\n            max_prefix_len=10,\n            max_epochs=10,\n            batch_size=128,\n            lr=1e-3,\n            verbose=False,\n        )\n        res_20e = train_eval_run(\n            df,\n            dname,\n            max_prefix_len=10,\n            max_epochs=20,\n            batch_size=128,\n            lr=1e-3,\n            verbose=False,\n        )\n        if res_10e is None or res_20e is None:\n            print(\"Not enough data to train for this dataset. Skipping.\")\n            continue\n        top3_10 = res_10e[\"final\"][\"val\"][\"top3\"]\n        top3_20 = res_20e[\"final\"][\"val\"][\"top3\"]\n        epoch_improved = top3_20 > top3_10 + 0.005\n        experiment_data[\"max_prefix_len\"][dname][\"epochs_check\"] = {\n            \"val_top3_10epochs\": float(top3_10),\n            \"val_top3_20epochs\": float(top3_20),\n            \"improved\": bool(epoch_improved),\n        }\n        print(\n            f\"Epochs check: val_top3@10ep={top3_10:.4f}, @20ep={top3_20:.4f}, improved={epoch_improved}\"\n        )\n\n        # Hyperparameter sweep over max_prefix_len\n        for mlen in prefix_candidates:\n            print(f\"Tuning run: max_prefix_len={mlen}\")\n            res = train_eval_run(\n                df,\n                dname,\n                max_prefix_len=mlen,\n                max_epochs=10,\n                batch_size=128,\n                lr=1e-3,\n                verbose=False,\n            )\n            if res is None:\n                print(f\"Skipping prefix_len={mlen} due to insufficient data.\")\n                continue\n            # Record per-epoch losses and metrics\n            hist = res[\"hist\"]\n            # Save in standardized containers; tag with hyperparam\n            experiment_data[\"max_prefix_len\"][dname][\"losses\"][\"train\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"loss_per_epoch\": np.array(hist[\"train_loss\"], dtype=np.float32),\n                }\n            )\n            experiment_data[\"max_prefix_len\"][dname][\"losses\"][\"val\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"loss_per_epoch\": np.array(hist[\"val_loss\"], dtype=np.float32),\n                }\n            )\n            experiment_data[\"max_prefix_len\"][dname][\"metrics\"][\"val\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"acc_per_epoch\": np.array(hist[\"val_acc\"], dtype=np.float32),\n                    \"macro_f1_per_epoch\": np.array(hist[\"val_f1\"], dtype=np.float32),\n                    \"top3_per_epoch\": np.array(hist[\"val_top3\"], dtype=np.float32),\n                }\n            )\n            experiment_data[\"max_prefix_len\"][dname][\"metrics\"][\"train\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"loss_per_epoch\": np.array(hist[\"train_loss\"], dtype=np.float32),\n                }\n            )\n            # Final results\n            final = res[\"final\"]\n            run_record = {\n                \"max_prefix_len\": mlen,\n                \"final_train\": final[\"train\"],\n                \"final_val\": final[\"val\"],\n                \"final_test\": final[\"test\"],\n            }\n            experiment_data[\"max_prefix_len\"][dname][\"runs\"].append(run_record)\n            # Predictions\n            experiment_data[\"max_prefix_len\"][dname][\"predictions\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"y_pred_test\": np.array(res[\"y_pred_test\"], dtype=np.int64),\n                }\n            )\n            experiment_data[\"max_prefix_len\"][dname][\"ground_truth\"].append(\n                {\n                    \"max_prefix_len\": mlen,\n                    \"y_true_test\": np.array(res[\"y_true_test\"], dtype=np.int64),\n                }\n            )\n        # Optionally identify best prefix by val top-3\n        best_prefix = None\n        best_val_top3 = -1.0\n        for r in experiment_data[\"max_prefix_len\"][dname][\"runs\"]:\n            vt3 = r[\"final_val\"][\"top3\"]\n            if vt3 > best_val_top3:\n                best_val_top3 = vt3\n                best_prefix = r[\"max_prefix_len\"]\n        print(\n            f\"[{dname}] Best max_prefix_len by val top-3: {best_prefix} (val_top3={best_val_top3:.4f})\"\n        )\n\n    # Save all experiment data as a single numpy file as required\n    np.save(\"experiment_data.npy\", experiment_data)\n\n\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: max_prefix_len.\nI will add a hyperparameter sweep over max_prefix_len to test values [5, 10, 15, 20, 30] and compare validation metrics (accuracy, macro-F1, top-3). Before sweeping, I will check if simply increasing training epochs (10 vs. 20) at max_prefix_len=10 improves validation top-3; if not, I proceed with the sweep. The implementation will use pm4py to load local XES files, perform time-based splits, and train an LSTM baseline while collecting and saving detailed metrics and predictions into a single experiment_data.npy, organized by hyperparameter and dataset. The code remains self-contained and executes the full pipeline without external dependencies beyond pm4py and PyTorch.","overall_plan":"","plot_code":null,"plot_plan":null,"step":8,"id":"a1bad1cf5aec4ddfbb370ed8a179b41b","ctime":1757759667.500611,"_term_out":["Using device: cuda","\n","Execution time: a second seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":1.0331785678863525,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The run output is essentially empty (only shows device and a harness time note), indicating the experiment did not actually execute the tuning/evaluation loop. There are concrete issues in the code that would prevent meeting the stage goals even if it ran:\n\n1) Data discovery bug: find_xes_files only searches CWD and CWD/data, ignoring the mandated ./input directory (and typical parent/workspace inputs). As a result, local BPI 2012/2017/ROAD logs in input/* will not be found, triggering the synthetic fallback and violating the requirement to use those logs.\n\n2) Silent synthetic fallback: If pm4py is missing or no XES are found, the code silently generates a synthetic dataset and proceeds. This violates the PPM constraints (must use local XES logs and evaluate on BPI 2017 and Road Traffic Fine). The script should fail loudly or instruct installation of pm4py instead of proceeding with synthetic data for this stage.\n\n3) Missing required targets and metrics: The implementation only supports next-activity classification. It does not implement remaining_time or SLA targets or their metrics. For baseline_tuning, at least per-log metrics for required logs and the specified metrics must be produced.\n\n4) Per-log evaluation not ensured: The loader names datasets by filename and does not ensure loading the required BPI2017 and ROAD logs. There is no explicit per-log reporting for those two required datasets in the output shown.\n\n5) Output/traceability: The script saves a numpy .npy with a nested dict of numpy arrays; many runners disallow pickled numpy objects. Prefer JSON/CSV for metrics and keep arrays as lists to avoid serialization issues.\n\n6) Minor: xes pm4py import is optional; if import succeeds but logs are compressed or placed in ./input, they still won\u2019t be discovered due to (1). Also, no resource features are included despite the research idea, but that is acceptable for the LSTM baseline; however, it undermines the resource-centric angle.\n\nProposed fixes:\n- Replace find_xes_files with robust discovery that prioritizes ./input and common workspace paths (reuse _resolve_data_dir from ai_scientist/ideas/my_research_topic.py). Search for patterns matching BPI_Challenge_2012, BPI_Challenge_2017, and Road_Traffic_Fine_Management_Process.\n- Remove synthetic fallback for this stage. If pm4py is missing or no logs are found, raise an error with clear instructions to install pm4py and place XES logs under ./input.\n- Ensure explicit loading and separate evaluation for BPI2017 and ROAD, maintaining time-based splits, and report per-log metrics (acc/macro-F1/top-3) at minimum for next-activity.\n- If extending targets, add selectable target='next_activity'|'remaining_time'|'SLA' and compute the required metrics (MAE/RMSE/MAPE for time; AUC/F1 for SLA) without changing the model family.\n- Improve logging so epochs, hyperparameter sweeps, and best-prefix selection are printed for each dataset, and persist results to JSON (metrics per epoch and final per split) for reproducibility.\n- Optional: Validate that train/val/test case sets are disjoint and ordered by start time, and log counts to confirm no leakage.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"max_prefix_len","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"import os\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport matplotlib.pyplot as plt  # not used for saving, kept for compatibility\nfrom datetime import datetime\n\n# Device handling\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n# Experiment data structure as required\nexperiment_data = {\n    \"hyperparam_tuning_type_1\": {\n        # dataset_name: {...}\n    }\n}\n\n\n# pm4py loader utilities\ndef load_xes_to_df(path):\n    try:\n        import pm4py\n    except Exception as e:\n        print(\"pm4py is required to load XES files. Please install pm4py.\")\n        raise e\n    log = pm4py.read_xes(path)\n    rows = []\n    for case in log:\n        case_id = case.attributes.get(\"concept:name\", None)\n        for ev in case:\n            act = ev.get(\"concept:name\", None)\n            ts = ev.get(\"time:timestamp\", None)\n            lc = ev.get(\"lifecycle:transition\", None)\n            if ts is not None and not isinstance(ts, pd.Timestamp):\n                try:\n                    ts = pd.to_datetime(ts, utc=True)\n                except Exception:\n                    ts = pd.Timestamp(ts, tz=\"UTC\")\n            rows.append(\n                {\n                    \"case_id\": str(case_id),\n                    \"activity\": str(act),\n                    \"timestamp\": ts,\n                    \"lifecycle\": str(lc) if lc is not None else None,\n                }\n            )\n    df = pd.DataFrame(rows)\n    df = df.dropna(subset=[\"case_id\", \"activity\", \"timestamp\"])\n    df[\"timestamp\"] = pd.to_datetime(df[\"timestamp\"], utc=True)\n    return df\n\n\ndef discover_datasets():\n    # Try common filenames; collect all present\n    candidates = {\n        \"BPI2012\": [\"BPI_Challenge_2012.xes\", \"BPI2012.xes\", \"BPI2012_COMPLETE.xes\"],\n        \"BPI2017\": [\"BPI2017.xes\", \"BPI_Challenge_2017.xes\"],\n        \"ROAD\": [\"Road_Traffic_Fine_Management_Process.xes\", \"ROAD.xes\"],\n    }\n    found = {}\n    cwd = os.getcwd()\n    for name, files in candidates.items():\n        for fn in files:\n            p = os.path.join(cwd, fn)\n            if os.path.isfile(p):\n                try:\n                    df = load_xes_to_df(p)\n                    found[name] = df\n                    print(f\"Loaded {name} from {fn} with {len(df)} events.\")\n                    break\n                except Exception as e:\n                    print(f\"Failed to load {fn}: {e}\")\n    if not found:\n        print(\n            \"No known XES files found in current directory. Please place XES files locally.\"\n        )\n    return found\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        ts_ns = pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        ts = (ts_ns // 10**9).astype(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef prepare_dataloaders(df, max_prefix_len=10, batch_size=128):\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    return dl_train, dl_val, dl_test, act2id, pad_id\n\n\ndef train_model(\n    dl_train,\n    dl_val,\n    vocab_size,\n    pad_id,\n    num_layers=1,\n    hidden=128,\n    emb_dim=64,\n    cont_dim=5,\n    lr=1e-3,\n    max_epochs=10,\n    verbose=True,\n    dataset_key=None,\n    record_container=None,\n):\n    model = LSTMBaseline(\n        vocab_size=vocab_size,\n        emb_dim=emb_dim,\n        cont_dim=cont_dim,\n        hidden=hidden,\n        num_layers=num_layers,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\n        \"train_loss\": [],\n        \"val_loss\": [],\n        \"val_acc\": [],\n        \"val_f1\": [],\n        \"val_top3\": [],\n    }\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, vocab_size, pad_id\n        )\n        if verbose:\n            print(\n                f\"Epoch {epoch}: val_loss={val_loss:.4f} acc={val_acc:.4f} f1={val_f1:.4f} top3={val_top3:.4f}\"\n            )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_acc\"].append(val_acc)\n        hist[\"val_f1\"].append(val_f1)\n        hist[\"val_top3\"].append(val_top3)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    return model, hist, best_val_top3\n\n\ndef run_experiment_on_dataset(name, df, max_prefix_len=10, batch_size=128, lr=1e-3):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # cap to 5000 earliest cases for speed\n    try:\n        starts = (\n            df.sort_values(\"timestamp\")\n            .groupby(\"case_id\")[\"timestamp\"]\n            .min()\n            .reset_index()\n        )\n        if len(starts) > 5000:\n            keep_cases = set(starts.iloc[:5000][\"case_id\"])\n            df = df[df[\"case_id\"].isin(keep_cases)].copy()\n    except Exception:\n        pass\n\n    dl_train, dl_val, dl_test, act2id, pad_id = prepare_dataloaders(\n        df, max_prefix_len=max_prefix_len, batch_size=batch_size\n    )\n    vocab_size = len(act2id)\n    if vocab_size < 2:\n        print(\"Not enough activities to train. Skipping.\")\n        return\n\n    # Phase 1: Check if simply training longer helps (num_layers=1, epochs 10 vs 20)\n    longer_check = {}\n    for ep in [10, 20]:\n        print(f\"Longer-training check: epochs={ep}, num_layers=1\")\n        model_lc, hist_lc, best_val_top3_lc = train_model(\n            dl_train,\n            dl_val,\n            vocab_size,\n            pad_id,\n            num_layers=1,\n            hidden=128,\n            emb_dim=64,\n            cont_dim=5,\n            lr=lr,\n            max_epochs=ep,\n            verbose=True,\n        )\n        longer_check[ep] = {\n            \"history\": hist_lc,\n            \"best_val_top3\": best_val_top3_lc,\n        }\n\n    # Phase 2: Grid search over num_layers with fixed epochs=10\n    grid = [1, 2, 3]\n    results = {}\n    best_model = None\n    best_cfg = None\n    best_val_top3 = -1.0\n    fixed_epochs = 10\n    for nl in grid:\n        print(f\"Tuning num_layers={nl} for {fixed_epochs} epochs\")\n        model, hist, val_top3 = train_model(\n            dl_train,\n            dl_val,\n            vocab_size,\n            pad_id,\n            num_layers=nl,\n            hidden=128,\n            emb_dim=64,\n            cont_dim=5,\n            lr=lr,\n            max_epochs=fixed_epochs,\n            verbose=True,\n        )\n        results[nl] = {\"history\": hist, \"val_top3\": val_top3}\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_model = model\n            best_cfg = {\"num_layers\": nl, \"epochs\": fixed_epochs}\n\n    # Final evaluation on train/val/test with best model\n    criterion = nn.CrossEntropyLoss().to(device)\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        best_model, dl_train, criterion, device, vocab_size, pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        best_model, dl_val, criterion, device, vocab_size, pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        best_model, dl_test, criterion, device, vocab_size, pad_id\n    )\n\n    # Store all data under required structure\n    if \"hyperparam_tuning_type_1\" not in experiment_data:\n        experiment_data[\"hyperparam_tuning_type_1\"] = {}\n    experiment_data[\"hyperparam_tuning_type_1\"][name] = {\n        \"settings\": {\n            \"hidden_size\": 128,\n            \"emb_dim\": 64,\n            \"lr\": lr,\n            \"batch_size\": batch_size,\n            \"max_prefix_len\": max_prefix_len,\n            \"grid_num_layers\": grid,\n            \"selection_metric\": \"val_top3\",\n            \"longer_training_epochs\": [10, 20],\n        },\n        \"longer_training_check\": longer_check,\n        \"grid_search\": results,\n        \"selected_model\": {\n            \"num_layers\": best_cfg[\"num_layers\"] if best_cfg else None,\n            \"epochs\": best_cfg[\"epochs\"] if best_cfg else None,\n            \"best_val_top3\": best_val_top3,\n        },\n        \"metrics\": {\n            \"train\": [\n                {\n                    \"loss\": train_loss,\n                    \"acc\": train_acc,\n                    \"macro_f1\": train_f1,\n                    \"top3\": train_top3,\n                }\n            ],\n            \"val\": [\n                {\"loss\": val_loss, \"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3}\n            ],\n            \"test\": [\n                {\n                    \"loss\": test_loss,\n                    \"acc\": test_acc,\n                    \"macro_f1\": test_f1,\n                    \"top3\": test_top3,\n                }\n            ],\n        },\n        \"losses\": {\n            # for convenience, store final losses; full histories are in grid_search\n            \"train\": [train_loss],\n            \"val\": [val_loss],\n        },\n        \"predictions\": y_pred_t.tolist(),\n        \"ground_truth\": y_true_t.tolist(),\n        \"probs_shape\": list(probs_t.shape),\n    }\n    print(\n        f\"[{name}] Selected num_layers={best_cfg['num_layers']} | Test top-3={test_top3:.4f}, acc={test_acc:.4f}, f1={test_f1:.4f}\"\n    )\n\n\ndef main():\n    datasets = discover_datasets()\n    if not datasets:\n        # No datasets found; exit gracefully but still save empty structure\n        print(\"No datasets loaded. Saving empty experiment data.\")\n        np.save(\"experiment_data.npy\", experiment_data, allow_pickle=True)\n        return\n    for key, df in datasets.items():\n        try:\n            run_experiment_on_dataset(\n                key, df, max_prefix_len=10, batch_size=128, lr=1e-3\n            )\n        except Exception as e:\n            print(f\"Error on dataset {key}: {e}\")\n    # Save experiment data (single required file)\n    np.save(\"experiment_data.npy\", experiment_data, allow_pickle=True)\n    print(\"Saved experiment data to experiment_data.npy\")\n\n\nif __name__ == \"__main__\":\n    main()\n","plan":"Hyperparam tuning name: num_layers.\nI will replace the custom dataset loader with a pm4py-based XES loader, construct a prefix prediction dataset, and maintain the original LSTM baseline. First, I will run a sanity check to see if increasing epochs (from 10 to 20) for a 1-layer LSTM yields validation top-3 gains. Then, I will tune the LSTM depth over num_layers \u2208 {1, 2, 3} with hidden size fixed at 128 and select the best by validation top-3. Finally, I will evaluate the selected model on the test split and save all metrics, losses, predictions, and relevant metadata into a single experiment_data.npy under the required structure.","overall_plan":"","plot_code":null,"plot_plan":null,"step":9,"id":"658ae461b48144a5bce939113f629297","ctime":1757759688.4607246,"_term_out":["Using device: cuda","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":0.572425365447998,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"The run produced no meaningful experiment output beyond the device line. There are strong indications the script did not discover or load any logs, so no training/evaluation occurred. Root causes and fixes:\n\n1) Dataset discovery bug: discover_datasets() only checks the current working directory for a few exact filenames (e.g., BPI_Challenge_2012.xes) and ignores the required ./input directory and .xes.gz files. In this environment, logs are under input/*.xes(.gz), so nothing was found. Fix: adopt the robust discovery from ai_scientist/ideas/my_research_topic.py or update discover_datasets() to search input/ and data/ with glob patterns: input/*.xes, input/*.xes.gz, and fuzzy matches for BPI2012/2017 and Road_Traffic_Fine_Management_Process.\n\n2) Stage rule violation: The baseline_tuning stage disallows changing the model architecture from the previous stage. The code performs a grid search over num_layers=[1,2,3], which changes the LSTM architecture if the prior baseline was 1 layer. Fix: keep num_layers fixed at the baseline (e.g., 1) and tune only permissible hyperparameters: learning rate, epochs, batch size, max_prefix_len, dropout, weight decay, and feature knobs (calendar windows), while preserving the model architecture.\n\n3) Missing required per-log evaluations: The goal requires evaluating at least BPI 2017 and ROAD logs. Due to discovery issues, these were not evaluated. Fix follows from (1); after discovery, ensure both logs are loaded and evaluated with time-based splits.\n\n4) Logging/outputs: The code should log dataset discovery, split sizes, training epochs, and final per-log metrics. The provided execution output shows none of these. Add explicit prints for dataset loading results and for saving experiment_data.npy to verify completion.\n\n5) Minor: Feature normalization occurs twice (once over all samples in build_prefix_dataset and again using train-only stats in prepare_dataloaders). This is redundant and introduces transient leakage before being overwritten. Fix: remove normalization in build_prefix_dataset and perform normalization solely using train statistics in prepare_dataloaders.\n\nImplementing these fixes should allow proper loading from ./input, adherence to the tuning constraints, and generation of required metrics (acc/macro-F1/top-3) for the next-activity task on BPI2017 and ROAD.","exp_results_dir":null,"metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":"num_layers","is_seed_node":false,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"# Set random seed\nimport random\nimport numpy as np\nimport torch\n\nseed = 0\nrandom.seed(seed)\nnp.random.seed(seed)\ntorch.manual_seed(seed)\nif torch.cuda.is_available():\n    torch.cuda.manual_seed(seed)\n\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport matplotlib.pyplot as plt\n\n# Device handling (required)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure\nexperiment_data = {\n    \"BPI2012\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"BPI2017\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"ROAD\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n}\n\n# Data loading utilities (use provided helper)\nfrom ai_scientist.ideas.my_research_topic import load_datasets, pick_default_dataset\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    # Keep only 'complete' transitions if lifecycle exists\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()  # fallback if empty\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    # Build activity vocab\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        # Convert to numpy arrays for safe positional indexing\n        ts_ns = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        )  # nanoseconds\n        ts = (ts_ns // 10**9).astype(np.int64)  # seconds as numpy array\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        # simple calendar features\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        # time deltas and since start in seconds\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(\n            np.float32\n        )  # [T,5]\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        # Generate prefixes of length k (min_prefix_len..min(max_prefix_len, T-1)); target = activity at position k\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    # Collect feature normalization stats over all feats (initial; will be recomputed on train split)\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)  # [B,T,emb]\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            # top-3 correctness\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_one_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples across all to get vocab; we'll re-normalize with train stats\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter per split\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training loop\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {epoch}: validation_loss = {val_loss:.4f} | val_acc={val_acc:.4f} | val_f1={val_f1:.4f} | val_top3={val_top3:.4f}\"\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        experiment_data[name][\"losses\"][\"train\"].append((epoch, train_loss))\n        experiment_data[name][\"losses\"][\"val\"].append((epoch, val_loss))\n        experiment_data[name][\"metrics\"][\"val\"].append(\n            (epoch, {\"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3})\n        )\n        experiment_data[name][\"epochs\"].append(epoch)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n\n    # Load best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final eval on train/val/test\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Save metrics\n    experiment_data[name][\"metrics\"][\"train\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n        )\n    )\n    experiment_data[name][\"metrics\"][\"val\"].append(\n        (\n            \"final\",\n            {\"loss\": val_loss, \"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3},\n        )\n    )\n    experiment_data[name][\"metrics\"][\"test\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        )\n    )\n    experiment_data[name][\"predictions\"] = y_pred_t.tolist()\n    experiment_data[name][\"ground_truth\"] = y_true_t.tolist()\n\n    # Plots\n    try:\n        plt.figure()\n        plt.plot(hist[\"train_loss\"], label=\"train_loss\")\n        plt.plot(hist[\"val_loss\"], label=\"val_loss\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"loss_curves_{name}.png\"))\n        plt.close()\n\n        plt.figure()\n        plt.plot(hist[\"val_top3\"], label=\"val_top3\")\n        plt.legend()\n        plt.title(f\"Val Top-3 Acc - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Top-3 Acc\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"val_top3_{name}.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"[warn] Plotting failed: {e}\")\n\n    # Save confusion matrix-like data (optional)\n    try:\n        from sklearn.metrics import confusion_matrix\n\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"cm_{name}.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n\n\ndef main():\n    datasets = load_datasets()\n    # Loop through loaded datasets; cap to 5000 earliest cases for speed\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        train_one_dataset(\n            key, df_small, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    np.savez_compressed(\n        os.path.join(working_dir, \"experiment_data_compressed.npz\"),\n        data=experiment_data,\n    )\n\n\n# Execute immediately\nmain()\n","plan":"Seed node","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import (\n    f1_score,\n    accuracy_score,\n    confusion_matrix,\n    precision_recall_curve,\n    average_precision_score,\n)\nfrom sklearn.preprocessing import label_binarize\nimport random\nimport math\nfrom collections import defaultdict\n\n# Reproducibility and device\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# --------- Data loading from local XES via pm4py ----------\ndef load_xes_folder(data_dir=\"data\"):\n    datasets = {}\n    try:\n        import pm4py\n    except Exception as e:\n        print(f\"pm4py not available: {e}\")\n        return datasets\n    if not os.path.isdir(data_dir):\n        print(f\"Data directory not found: {data_dir}\")\n        return datasets\n    for fn in os.listdir(data_dir):\n        if fn.lower().endswith(\".xes\") or fn.lower().endswith(\".xes.gz\"):\n            path = os.path.join(data_dir, fn)\n            try:\n                log = pm4py.read_xes(path)\n                df = pm4py.convert_to_dataframe(log)\n                # Standardize columns\n                # pm4py dataframe typically has case:concept:name, concept:name, time:timestamp, lifecycle:transition\n                cols = df.columns\n                case_col = (\n                    \"case:concept:name\"\n                    if \"case:concept:name\" in cols\n                    else (\"case\" if \"case\" in cols else None)\n                )\n                act_col = (\n                    \"concept:name\"\n                    if \"concept:name\" in cols\n                    else (\"activity\" if \"activity\" in cols else None)\n                )\n                ts_col = (\n                    \"time:timestamp\"\n                    if \"time:timestamp\" in cols\n                    else (\"timestamp\" if \"timestamp\" in cols else None)\n                )\n                life_col = (\n                    \"lifecycle:transition\"\n                    if \"lifecycle:transition\" in cols\n                    else (\"lifecycle\" if \"lifecycle\" in cols else None)\n                )\n                if case_col is None or act_col is None or ts_col is None:\n                    print(f\"Missing required columns in {fn}, skipping.\")\n                    continue\n                out = pd.DataFrame(\n                    {\n                        \"case_id\": df[case_col].astype(str).values,\n                        \"activity\": df[act_col].astype(str).values,\n                        \"timestamp\": pd.to_datetime(df[ts_col], utc=True),\n                    }\n                )\n                if life_col is not None:\n                    out[\"lifecycle\"] = df[life_col].astype(str).values\n                name = os.path.splitext(fn)[0]\n                datasets[name] = out\n                print(\n                    f\"Loaded {name}: {len(out)} events, {out['case_id'].nunique()} cases\"\n                )\n            except Exception as e:\n                print(f\"Failed to load {fn}: {e}\")\n    return datasets\n\n\n# --------- Prefix building and split ----------\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if mask.any():\n            df = df[mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        if len(g) < 2:\n            continue\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        ts = (g_ts.astype(\"int64\") // 10**9).to_numpy(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                    \"prefix_len\": k,\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    for s in samples:\n        pass  # initial no norm; will norm on train split\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.vstack(\n            [\n                np.zeros((pad_len, self.num_cont), dtype=np.float32),\n                feats.astype(np.float32),\n            ]\n        )\n        attn = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad).long(),\n            \"feats\": torch.tensor(feats_pad).float(),\n            \"mask\": torch.tensor(attn).float(),\n            \"y\": torch.tensor(s[\"target\"]).long(),\n            \"prefix_len\": L,\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, pad_idx=0):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim, hidden_size=hidden, batch_first=True\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h = self.dropout(h[-1])\n        return self.fc(h)\n\n\ndef collate_fn(batch):\n    out = {\n        k: (\n            torch.stack([b[k] for b in batch], 0)\n            if isinstance(batch[0][k], torch.Tensor)\n            else [b[k] for b in batch]\n        )\n        for k in batch[0].keys()\n    }\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys = []\n    yhat = []\n    probs_list = []\n    n = 0\n    top3_correct = 0\n    pref_lens = []\n    top3_flags = []\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk = torch.topk(probs, k=k_val, dim=1)\n            y = batch[\"y\"]\n            ys.extend(y.detach().cpu().tolist())\n            yhat.extend(top1.detach().cpu().tolist())\n            probs_list.append(probs.detach().cpu().numpy())\n            for i in range(y.size(0)):\n                flag = int(y[i].item() in topk[i].detach().cpu().tolist())\n                top3_correct += flag\n                top3_flags.append(flag)\n                pref_lens.append(int(batch[\"prefix_len\"][i].item()))\n            n += y.size(0)\n    avg_loss = total_loss / max(1, n)\n    y_true = np.array(ys)\n    y_pred = np.array(yhat)\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n))\n    probs_concat = (\n        np.concatenate(probs_list, axis=0)\n        if len(probs_list) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return (\n        avg_loss,\n        acc,\n        f1,\n        top3,\n        y_true,\n        y_pred,\n        probs_concat,\n        np.array(pref_lens),\n        np.array(top3_flags),\n    )\n\n\ndef train_on_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    s_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    s_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    s_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # normalize time features on train\n    if len(s_train) > 0:\n        feats = np.concatenate(\n            [s[\"seq_feats\"] for s in s_train if len(s[\"seq_feats\"]) > 0], axis=0\n        )\n        dt_mean, dt_std = feats[:, 0].mean(), feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = feats[:, 1].mean(), feats[:, 1].std() + 1e-6\n\n        def norm(samples):\n            for s in samples:\n                if s[\"seq_feats\"].shape[0] > 0:\n                    s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                    s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n        norm(s_train)\n        norm(s_val)\n        norm(s_test)\n    print(\n        f\"Samples train/val/test: {len(s_train)}/{len(s_val)}/{len(s_test)}; vocab={len(act2id)}\"\n    )\n    if len(s_train) == 0 or len(act2id) < 2:\n        print(\"Insufficient data; skipping.\")\n        return None\n    ds_tr = PrefixDataset(s_train, pad_id, max_prefix_len, 5)\n    ds_va = PrefixDataset(s_val, pad_id, max_prefix_len, 5)\n    ds_te = PrefixDataset(s_test, pad_id, max_prefix_len, 5)\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn\n    )\n    dl_va = DataLoader(\n        ds_va, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    dl_te = DataLoader(\n        ds_te, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    model = LSTMBaseline(\n        vocab_size=len(act2id), emb_dim=64, cont_dim=5, hidden=128, pad_idx=pad_id\n    ).to(device)\n    crit = nn.CrossEntropyLoss().to(device)\n    opt = torch.optim.Adam(model.parameters(), lr=lr)\n    best_top3 = -1.0\n    best_state = None\n    history = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for ep in range(1, max_epochs + 1):\n        model.train()\n        tot = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            opt.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = crit(logits, batch[\"y\"])\n            loss.backward()\n            opt.step()\n            run_loss += loss.item() * logits.size(0)\n            tot += logits.size(0)\n        tr_loss = run_loss / max(1, tot)\n        va_loss, va_acc, va_f1, va_top3, *_ = evaluate(\n            model, dl_va, crit, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {ep}: val_loss={va_loss:.4f} acc={va_acc:.4f} f1={va_f1:.4f} top3={va_top3:.4f}\"\n        )\n        history[\"train_loss\"].append(tr_loss)\n        history[\"val_loss\"].append(va_loss)\n        history[\"val_top3\"].append(va_top3)\n        if va_top3 > best_top3:\n            best_top3 = va_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    tr_loss, tr_acc, tr_f1, tr_top3, *_ = evaluate(\n        model, dl_tr, crit, device, len(act2id), pad_id\n    )\n    te_loss, te_acc, te_f1, te_top3, y_true, y_pred, probs, pref_lens, top3_flags = (\n        evaluate(model, dl_te, crit, device, len(act2id), pad_id)\n    )\n    print(\n        f\"[{name}] Test: loss={te_loss:.4f} acc={te_acc:.4f} f1={te_f1:.4f} top3={te_top3:.4f}\"\n    )\n    # package experiment data\n    exp = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": tr_loss,\n                        \"acc\": tr_acc,\n                        \"macro_f1\": tr_f1,\n                        \"top3\": tr_top3,\n                    },\n                )\n            ],\n            \"val\": [],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": te_loss,\n                        \"acc\": te_acc,\n                        \"macro_f1\": te_f1,\n                        \"top3\": te_top3,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(history[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(history[\"val_loss\"], start=1)),\n        },\n        \"predictions\": y_pred.tolist(),\n        \"ground_truth\": y_true.tolist(),\n        \"epochs\": list(range(1, len(history[\"train_loss\"]) + 1)),\n        \"probs\": probs,\n        \"prefix_lens\": pref_lens.tolist(),\n        \"top3_flags\": top3_flags.tolist(),\n        \"act2id\": act2id,\n    }\n    # plots for this dataset\n    try:\n        plt.figure()\n        plt.plot(history[\"train_loss\"], label=\"train\")\n        plt.plot(history[\"val_loss\"], label=\"val\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating loss curves for {name}: {e}\")\n        plt.close()\n    try:\n        cm = confusion_matrix(y_true, y_pred)\n        plt.figure(figsize=(5, 4))\n        plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n        plt.colorbar()\n        plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n        plt.xlabel(\"Predicted\")\n        plt.ylabel(\"True\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_confusion_matrix.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {name}: {e}\")\n        plt.close()\n    try:\n        # Top-3 accuracy vs prefix length\n        if len(pref_lens) > 0:\n            d = defaultdict(list)\n            for L, flag in zip(pref_lens, top3_flags):\n                d[int(L)].append(int(flag))\n            xs = sorted(d.keys())\n            ys = [np.mean(d[k]) for k in xs]\n            plt.figure()\n            plt.plot(xs, ys, marker=\"o\")\n            plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n            plt.xlabel(\"Prefix Length\")\n            plt.ylabel(\"Top-3 Accuracy\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_top3_vs_prefixlen.png\"))\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating Top-3 vs prefix length for {name}: {e}\")\n        plt.close()\n    try:\n        # Macro PR curve (one-vs-rest); may be coarse due to many classes\n        if probs.shape[0] > 0:\n            classes = np.unique(y_true)\n            Y = label_binarize(y_true, classes=range(probs.shape[1]))\n            # only keep columns present in classes to avoid PAD\n            present = [c for c in classes]\n            if len(present) > 1:\n                precisions = []\n                recalls = []\n                aps = []\n                for c in present:\n                    p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                    ap = average_precision_score(Y[:, c], probs[:, c])\n                    precisions.append(\n                        np.interp(np.linspace(0, 1, 101), r[::-1], p[::-1])\n                    )\n                    recalls.append(np.linspace(0, 1, 101))\n                    aps.append(ap)\n                macro_p = np.mean(np.stack(precisions, 0), 0)\n                macro_r = np.linspace(0, 1, 101)\n                plt.figure()\n                plt.plot(macro_r, macro_p, label=f\"Macro-PR (mAP={np.mean(aps):.3f})\")\n                plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Recall\")\n                plt.ylabel(\"Precision\")\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(os.path.join(working_dir, f\"{name}_macro_pr.png\"))\n                plt.close()\n    except Exception as e:\n        print(f\"Error creating PR curve for {name}: {e}\")\n        plt.close()\n    return name, exp\n\n\ndef main():\n    datasets = load_xes_folder(data_dir=os.path.join(os.getcwd(), \"data\"))\n    experiment_data = {}\n    for name, df in datasets.items():\n        # optional cap earliest 5000 cases\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep = set(starts.iloc[:5000][\"case_id\"])\n                df = df[df[\"case_id\"].isin(keep)].copy()\n        except:\n            pass\n        res = train_on_dataset(\n            name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n        if res is not None:\n            k, exp = res\n            experiment_data[k] = exp\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    # Print evaluation metrics\n    for k, v in experiment_data.items():\n        test_metrics = dict(v[\"metrics\"][\"test\"][0][1])\n        print(\n            f\"{k} | Test acc={test_metrics['acc']:.4f} macro_f1={test_metrics['macro_f1']:.4f} top3={test_metrics['top3']:.4f} loss={test_metrics['loss']:.4f}\"\n        )\n\n    # Secondary plotting pass strictly from experiment_data.npy (as required)\n    try:\n        experiment_data_loaded = np.load(\n            os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n        ).item()\n    except Exception as e:\n        print(f\"Error loading experiment data: {e}\")\n        experiment_data_loaded = {}\n    for name, ed in experiment_data_loaded.items():\n        try:\n            # re-plot loss curves from saved data\n            plt.figure()\n            tl = [y for (_, y) in ed.get(\"losses\", {}).get(\"train\", [])]\n            vl = [y for (_, y) in ed.get(\"losses\", {}).get(\"val\", [])]\n            if len(tl) > 0:\n                plt.plot(tl, label=\"train\")\n            if len(vl) > 0:\n                plt.plot(vl, label=\"val\")\n            plt.legend()\n            plt.title(f\"Loss Curves - {name}\\nNext-activity\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves_reload.png\"))\n            plt.close()\n        except Exception as e:\n            print(f\"Error creating plot1: {e}\")\n            plt.close()\n        try:\n            # confusion matrix from predictions and ground truth\n            y_true = ed.get(\"ground_truth\", [])\n            y_pred = ed.get(\"predictions\", [])\n            if len(y_true) > 0 and len(y_pred) > 0:\n                cm = confusion_matrix(y_true, y_pred)\n                plt.figure(figsize=(5, 4))\n                plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n                plt.colorbar()\n                plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Predicted\")\n                plt.ylabel(\"True\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_confusion_matrix_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot2: {e}\")\n            plt.close()\n        try:\n            # Top-3 vs prefix length if present\n            pref = ed.get(\"prefix_lens\", [])\n            flags = ed.get(\"top3_flags\", [])\n            if len(pref) > 0 and len(flags) > 0:\n                d = defaultdict(list)\n                for L, f in zip(pref, flags):\n                    d[int(L)].append(int(f))\n                xs = sorted(d.keys())\n                ys = [float(np.mean(d[x])) for x in xs]\n                plt.figure()\n                plt.plot(xs, ys, marker=\"o\")\n                plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n                plt.xlabel(\"Prefix Length\")\n                plt.ylabel(\"Top-3 Accuracy\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_top3_vs_prefixlen_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot3: {e}\")\n            plt.close()\n        try:\n            # Macro PR curve if probs available\n            probs = np.array(ed.get(\"probs\", []))\n            y_true = ed.get(\"ground_truth\", [])\n            if probs.size > 0 and len(y_true) > 0:\n                classes = sorted(set(y_true))\n                Y = label_binarize(np.array(y_true), classes=range(probs.shape[1]))\n                present = classes\n                if len(present) > 1:\n                    precisions = []\n                    aps = []\n                    grid = np.linspace(0, 1, 101)\n                    for c in present:\n                        p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                        precisions.append(np.interp(grid, r[::-1], p[::-1]))\n                        aps.append(average_precision_score(Y[:, c], probs[:, c]))\n                    macro_p = np.mean(np.stack(precisions, 0), 0)\n                    plt.figure()\n                    plt.plot(grid, macro_p, label=f\"mAP={np.mean(aps):.3f}\")\n                    plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                    plt.xlabel(\"Recall\")\n                    plt.ylabel(\"Precision\")\n                    plt.legend()\n                    plt.tight_layout()\n                    plt.savefig(\n                        os.path.join(working_dir, f\"{name}_macro_pr_reload.png\")\n                    )\n                    plt.close()\n        except Exception as e:\n            print(f\"Error creating plot4: {e}\")\n            plt.close()\n\n\nif __name__ == \"__main__\":\n    main()\n","plot_plan":null,"step":10,"id":"26f8c955090b4c65877fc01f0de569ba","ctime":1757762453.9800456,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Available in /workspace/data: ['BPI_Challenge_2012.xes', 'BPI_Challenge_2017.xes', 'Road_Traffic_Fine_Management_Process.xes']","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<22:23,  9.74it/s]","\rparsing log, completed traces ::   1%|1         | 157/13087 [00:00<00:14, 908.50it/s]","\rparsing log, completed traces ::   2%|2         | 315/13087 [00:00<00:10, 1209.92it/s]","\rparsing log, completed traces ::   3%|3         | 437/13087 [00:00<00:24, 511.41it/s] ","\rparsing log, completed traces ::   5%|4         | 602/13087 [00:00<00:17, 728.83it/s]","\rparsing log, completed traces ::   6%|6         | 790/13087 [00:00<00:12, 975.17it/s]","\rparsing log, completed traces ::   7%|7         | 938/13087 [00:01<00:11, 1093.30it/s]","\rparsing log, completed traces ::   8%|8         | 1100/13087 [00:01<00:09, 1222.79it/s]","\rparsing log, completed traces ::  10%|9         | 1272/13087 [00:01<00:08, 1351.01it/s]","\rparsing log, completed traces ::  11%|#1        | 1478/13087 [00:01<00:07, 1536.76it/s]","\rparsing log, completed traces ::  13%|#2        | 1656/13087 [00:01<00:07, 1600.59it/s]","\rparsing log, completed traces ::  14%|#3        | 1829/13087 [00:01<00:06, 1637.06it/s]","\rparsing log, completed traces ::  15%|#5        | 2001/13087 [00:01<00:06, 1631.41it/s]","\rparsing log, completed traces ::  17%|#6        | 2170/13087 [00:01<00:06, 1638.99it/s]","\rparsing log, completed traces ::  18%|#7        | 2344/13087 [00:01<00:06, 1664.53it/s]","\rparsing log, completed traces ::  19%|#9        | 2524/13087 [00:01<00:06, 1702.51it/s]","\rparsing log, completed traces ::  21%|##        | 2697/13087 [00:02<00:06, 1683.67it/s]","\rparsing log, completed traces ::  22%|##1       | 2867/13087 [00:02<00:06, 1639.10it/s]","\rparsing log, completed traces ::  23%|##3       | 3033/13087 [00:02<00:12, 830.13it/s] ","\rparsing log, completed traces ::  24%|##4       | 3184/13087 [00:02<00:10, 947.23it/s]","\rparsing log, completed traces ::  26%|##6       | 3438/13087 [00:02<00:07, 1261.22it/s]","\rparsing log, completed traces ::  28%|##7       | 3628/13087 [00:02<00:06, 1400.71it/s]","\rparsing log, completed traces ::  29%|##9       | 3804/13087 [00:03<00:06, 1475.49it/s]","\rparsing log, completed traces ::  31%|###       | 3996/13087 [00:03<00:05, 1586.01it/s]","\rparsing log, completed traces ::  33%|###2      | 4269/13087 [00:03<00:04, 1877.69it/s]","\rparsing log, completed traces ::  34%|###4      | 4475/13087 [00:03<00:04, 1903.65it/s]","\rparsing log, completed traces ::  36%|###5      | 4689/13087 [00:03<00:04, 1967.87it/s]","\rparsing log, completed traces ::  37%|###7      | 4896/13087 [00:03<00:04, 1926.85it/s]","\rparsing log, completed traces ::  39%|###8      | 5096/13087 [00:03<00:04, 1904.36it/s]","\rparsing log, completed traces ::  40%|####      | 5292/13087 [00:03<00:04, 1865.22it/s]","\rparsing log, completed traces ::  42%|####1     | 5482/13087 [00:03<00:04, 1773.17it/s]","\rparsing log, completed traces ::  43%|####3     | 5663/13087 [00:04<00:04, 1705.48it/s]","\rparsing log, completed traces ::  45%|####4     | 5836/13087 [00:04<00:04, 1686.30it/s]","\rparsing log, completed traces ::  46%|####6     | 6030/13087 [00:04<00:04, 1753.80it/s]","\rparsing log, completed traces ::  47%|####7     | 6207/13087 [00:04<00:04, 1716.92it/s]","\rparsing log, completed traces ::  49%|####9     | 6414/13087 [00:04<00:03, 1808.38it/s]","\rparsing log, completed traces ::  50%|#####     | 6596/13087 [00:04<00:07, 881.99it/s] ","\rparsing log, completed traces ::  52%|#####1    | 6764/13087 [00:04<00:06, 1010.92it/s]","\rparsing log, completed traces ::  53%|#####2    | 6911/13087 [00:05<00:05, 1095.48it/s]","\rparsing log, completed traces ::  54%|#####4    | 7079/13087 [00:05<00:04, 1219.43it/s]","\rparsing log, completed traces ::  55%|#####5    | 7252/13087 [00:05<00:04, 1338.15it/s]","\rparsing log, completed traces ::  57%|#####6    | 7411/13087 [00:05<00:04, 1371.99it/s]","\rparsing log, completed traces ::  58%|#####7    | 7566/13087 [00:05<00:03, 1397.85it/s]","\rparsing log, completed traces ::  59%|#####8    | 7719/13087 [00:05<00:03, 1424.57it/s]","\rparsing log, completed traces ::  60%|######    | 7887/13087 [00:05<00:03, 1481.37it/s]","\rparsing log, completed traces ::  61%|######1   | 8042/13087 [00:05<00:03, 1488.30it/s]","\rparsing log, completed traces ::  63%|######2   | 8221/13087 [00:05<00:03, 1569.83it/s]","\rparsing log, completed traces ::  64%|######4   | 8385/13087 [00:06<00:02, 1584.60it/s]","\rparsing log, completed traces ::  65%|######5   | 8556/13087 [00:06<00:02, 1617.87it/s]","\rparsing log, completed traces ::  67%|######6   | 8727/13087 [00:06<00:02, 1643.29it/s]","\rparsing log, completed traces ::  68%|######7   | 8893/13087 [00:06<00:02, 1608.59it/s]","\rparsing log, completed traces ::  69%|######9   | 9055/13087 [00:06<00:02, 1578.70it/s]","\rparsing log, completed traces ::  71%|#######   | 9228/13087 [00:06<00:02, 1622.05it/s]","\rparsing log, completed traces ::  72%|#######1  | 9406/13087 [00:06<00:02, 1665.62it/s]","\rparsing log, completed traces ::  73%|#######3  | 9574/13087 [00:06<00:02, 1562.02it/s]","\rparsing log, completed traces ::  74%|#######4  | 9739/13087 [00:06<00:02, 1584.55it/s]","\rparsing log, completed traces ::  76%|#######5  | 9915/13087 [00:06<00:01, 1627.16it/s]","\rparsing log, completed traces ::  77%|#######7  | 10079/13087 [00:07<00:04, 743.03it/s]","\rparsing log, completed traces ::  78%|#######8  | 10226/13087 [00:07<00:03, 857.96it/s]","\rparsing log, completed traces ::  79%|#######9  | 10393/13087 [00:07<00:02, 1007.99it/s]","\rparsing log, completed traces ::  80%|########  | 10535/13087 [00:07<00:02, 1063.43it/s]","\rparsing log, completed traces ::  82%|########1 | 10698/13087 [00:07<00:02, 1190.00it/s]","\rparsing log, completed traces ::  83%|########3 | 10883/13087 [00:07<00:01, 1348.51it/s]","\rparsing log, completed traces ::  85%|########4 | 11065/13087 [00:08<00:01, 1468.91it/s]","\rparsing log, completed traces ::  86%|########5 | 11229/13087 [00:08<00:01, 1513.39it/s]","\rparsing log, completed traces ::  87%|########7 | 11437/13087 [00:08<00:00, 1669.76it/s]","\rparsing log, completed traces ::  89%|########8 | 11614/13087 [00:08<00:00, 1675.45it/s]","\rparsing log, completed traces ::  90%|######### | 11823/13087 [00:08<00:00, 1793.11it/s]","\rparsing log, completed traces ::  92%|#########1| 12011/13087 [00:08<00:00, 1817.08it/s]","\rparsing log, completed traces ::  93%|#########3| 12207/13087 [00:08<00:00, 1858.74it/s]","\rparsing log, completed traces ::  95%|#########4| 12404/13087 [00:08<00:00, 1885.01it/s]","\rparsing log, completed traces ::  96%|#########6| 12614/13087 [00:08<00:00, 1947.23it/s]","\rparsing log, completed traces ::  98%|#########7| 12811/13087 [00:08<00:00, 1918.72it/s]","\rparsing log, completed traces ::  99%|#########9| 13012/13087 [00:09<00:00, 1945.31it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:09<00:00, 1433.12it/s]","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:42:18,  1.86it/s]","\rparsing log, completed traces ::   0%|          | 68/31509 [00:00<03:42, 141.53it/s]","\rparsing log, completed traces ::   0%|          | 125/31509 [00:00<02:10, 239.79it/s]","\rparsing log, completed traces ::   1%|          | 192/31509 [00:00<01:30, 346.01it/s]","\rparsing log, completed traces ::   1%|          | 253/31509 [00:00<01:15, 414.15it/s]","\rparsing log, completed traces ::   1%|1         | 318/31509 [00:01<01:05, 474.99it/s]","\rparsing log, completed traces ::   1%|1         | 383/31509 [00:01<00:59, 519.73it/s]","\rparsing log, completed traces ::   1%|1         | 444/31509 [00:01<00:57, 541.16it/s]","\rparsing log, completed traces ::   2%|1         | 505/31509 [00:01<01:43, 299.31it/s]","\rparsing log, completed traces ::   2%|1         | 563/31509 [00:01<01:28, 348.62it/s]","\rparsing log, completed traces ::   2%|1         | 630/31509 [00:01<01:14, 413.55it/s]","\rparsing log, completed traces ::   2%|2         | 702/31509 [00:01<01:04, 479.84it/s]","\rparsing log, completed traces ::   2%|2         | 765/31509 [00:02<00:59, 513.80it/s]","\rparsing log, completed traces ::   3%|2         | 826/31509 [00:02<00:57, 536.89it/s]","\rparsing log, completed traces ::   3%|2         | 890/31509 [00:02<00:54, 563.67it/s]","\rparsing log, completed traces ::   3%|3         | 961/31509 [00:02<00:50, 603.30it/s]","\rparsing log, completed traces ::   3%|3         | 1028/31509 [00:02<00:48, 622.11it/s]","\rparsing log, completed traces ::   3%|3         | 1093/31509 [00:02<00:49, 609.98it/s]","\rparsing log, completed traces ::   4%|3         | 1160/31509 [00:02<00:48, 624.32it/s]","\rparsing log, completed traces ::   4%|3         | 1229/31509 [00:02<00:47, 640.87it/s]","\rparsing log, completed traces ::   4%|4         | 1295/31509 [00:02<00:46, 643.67it/s]","\rparsing log, completed traces ::   4%|4         | 1364/31509 [00:02<00:45, 657.16it/s]","\rparsing log, completed traces ::   5%|4         | 1431/31509 [00:03<00:46, 643.38it/s]","\rparsing log, completed traces ::   5%|4         | 1496/31509 [00:03<00:47, 636.95it/s]","\rparsing log, completed traces ::   5%|4         | 1562/31509 [00:03<00:46, 643.23it/s]","\rparsing log, completed traces ::   5%|5         | 1627/31509 [00:03<00:46, 642.45it/s]","\rparsing log, completed traces ::   5%|5         | 1692/31509 [00:03<01:30, 329.32it/s]","\rparsing log, completed traces ::   6%|5         | 1757/31509 [00:03<01:17, 384.74it/s]","\rparsing log, completed traces ::   6%|5         | 1816/31509 [00:04<01:09, 425.61it/s]","\rparsing log, completed traces ::   6%|5         | 1874/31509 [00:04<01:04, 458.39it/s]","\rparsing log, completed traces ::   6%|6         | 1939/31509 [00:04<00:58, 504.24it/s]","\rparsing log, completed traces ::   6%|6         | 2003/31509 [00:04<00:54, 538.05it/s]","\rparsing log, completed traces ::   7%|6         | 2066/31509 [00:04<00:52, 562.02it/s]","\rparsing log, completed traces ::   7%|6         | 2132/31509 [00:04<00:49, 588.42it/s]","\rparsing log, completed traces ::   7%|6         | 2198/31509 [00:04<00:48, 601.91it/s]","\rparsing log, completed traces ::   7%|7         | 2268/31509 [00:04<00:46, 627.75it/s]","\rparsing log, completed traces ::   7%|7         | 2334/31509 [00:04<00:45, 636.28it/s]","\rparsing log, completed traces ::   8%|7         | 2399/31509 [00:04<00:45, 635.95it/s]","\rparsing log, completed traces ::   8%|7         | 2464/31509 [00:05<00:45, 639.84it/s]","\rparsing log, completed traces ::   8%|8         | 2529/31509 [00:05<00:45, 640.66it/s]","\rparsing log, completed traces ::   8%|8         | 2604/31509 [00:05<00:43, 669.43it/s]","\rparsing log, completed traces ::   8%|8         | 2672/31509 [00:05<00:42, 672.12it/s]","\rparsing log, completed traces ::   9%|8         | 2740/31509 [00:05<00:43, 655.71it/s]","\rparsing log, completed traces ::   9%|8         | 2811/31509 [00:05<00:42, 668.39it/s]","\rparsing log, completed traces ::   9%|9         | 2885/31509 [00:05<00:41, 688.58it/s]","\rparsing log, completed traces ::   9%|9         | 2958/31509 [00:05<00:40, 697.22it/s]","\rparsing log, completed traces ::  10%|9         | 3028/31509 [00:05<00:41, 691.89it/s]","\rparsing log, completed traces ::  10%|9         | 3098/31509 [00:06<01:24, 335.69it/s]","\rparsing log, completed traces ::  10%|#         | 3164/31509 [00:06<01:12, 390.45it/s]","\rparsing log, completed traces ::  10%|#         | 3225/31509 [00:06<01:05, 432.95it/s]","\rparsing log, completed traces ::  10%|#         | 3298/31509 [00:06<00:56, 496.96it/s]","\rparsing log, completed traces ::  11%|#         | 3369/31509 [00:06<00:51, 545.85it/s]","\rparsing log, completed traces ::  11%|#         | 3445/31509 [00:06<00:46, 599.26it/s]","\rparsing log, completed traces ::  11%|#1        | 3522/31509 [00:06<00:43, 642.07it/s]","\rparsing log, completed traces ::  11%|#1        | 3593/31509 [00:07<00:43, 634.98it/s]","\rparsing log, completed traces ::  12%|#1        | 3665/31509 [00:07<00:42, 656.61it/s]","\rparsing log, completed traces ::  12%|#1        | 3734/31509 [00:07<00:41, 665.82it/s]","\rparsing log, completed traces ::  12%|#2        | 3803/31509 [00:07<00:41, 670.38it/s]","\rparsing log, completed traces ::  12%|#2        | 3872/31509 [00:07<00:41, 660.80it/s]","\rparsing log, completed traces ::  13%|#2        | 3943/31509 [00:07<00:40, 672.57it/s]","\rparsing log, completed traces ::  13%|#2        | 4015/31509 [00:07<00:40, 686.10it/s]","\rparsing log, completed traces ::  13%|#2        | 4085/31509 [00:07<00:41, 666.05it/s]","\rparsing log, completed traces ::  13%|#3        | 4155/31509 [00:07<00:40, 672.15it/s]","\rparsing log, completed traces ::  13%|#3        | 4223/31509 [00:07<00:41, 661.98it/s]","\rparsing log, completed traces ::  14%|#3        | 4290/31509 [00:08<00:41, 648.77it/s]","\rparsing log, completed traces ::  14%|#3        | 4358/31509 [00:08<00:41, 657.05it/s]","\rparsing log, completed traces ::  14%|#4        | 4427/31509 [00:08<00:40, 666.38it/s]","\rparsing log, completed traces ::  14%|#4        | 4494/31509 [00:08<00:41, 656.38it/s]","\rparsing log, completed traces ::  14%|#4        | 4562/31509 [00:08<00:41, 657.01it/s]","\rparsing log, completed traces ::  15%|#4        | 4628/31509 [00:08<01:29, 301.14it/s]","\rparsing log, completed traces ::  15%|#4        | 4701/31509 [00:09<01:12, 369.48it/s]","\rparsing log, completed traces ::  15%|#5        | 4772/31509 [00:09<01:01, 431.65it/s]","\rparsing log, completed traces ::  15%|#5        | 4846/31509 [00:09<00:54, 493.60it/s]","\rparsing log, completed traces ::  16%|#5        | 4911/31509 [00:09<00:50, 526.64it/s]","\rparsing log, completed traces ::  16%|#5        | 4981/31509 [00:09<00:46, 569.08it/s]","\rparsing log, completed traces ::  16%|#6        | 5054/31509 [00:09<00:43, 610.47it/s]","\rparsing log, completed traces ::  16%|#6        | 5127/31509 [00:09<00:41, 641.63it/s]","\rparsing log, completed traces ::  16%|#6        | 5197/31509 [00:09<00:40, 643.66it/s]","\rparsing log, completed traces ::  17%|#6        | 5268/31509 [00:09<00:39, 659.30it/s]","\rparsing log, completed traces ::  17%|#6        | 5337/31509 [00:10<00:39, 666.12it/s]","\rparsing log, completed traces ::  17%|#7        | 5406/31509 [00:10<00:39, 659.60it/s]","\rparsing log, completed traces ::  17%|#7        | 5478/31509 [00:10<00:38, 673.39it/s]","\rparsing log, completed traces ::  18%|#7        | 5550/31509 [00:10<00:37, 685.93it/s]","\rparsing log, completed traces ::  18%|#7        | 5625/31509 [00:10<00:36, 703.49it/s]","\rparsing log, completed traces ::  18%|#8        | 5701/31509 [00:10<00:36, 715.42it/s]","\rparsing log, completed traces ::  18%|#8        | 5777/31509 [00:10<00:35, 723.73it/s]","\rparsing log, completed traces ::  19%|#8        | 5850/31509 [00:10<00:35, 722.71it/s]","\rparsing log, completed traces ::  19%|#8        | 5928/31509 [00:10<00:34, 738.71it/s]","\rparsing log, completed traces ::  19%|#9        | 6003/31509 [00:10<00:35, 723.40it/s]","\rparsing log, completed traces ::  19%|#9        | 6076/31509 [00:11<00:35, 707.01it/s]","\rparsing log, completed traces ::  20%|#9        | 6147/31509 [00:11<00:36, 704.34it/s]","\rparsing log, completed traces ::  20%|#9        | 6218/31509 [00:11<00:36, 702.40it/s]","\rparsing log, completed traces ::  20%|#9        | 6289/31509 [00:11<00:36, 698.96it/s]","\rparsing log, completed traces ::  20%|##        | 6359/31509 [00:11<00:36, 692.23it/s]","\rparsing log, completed traces ::  20%|##        | 6429/31509 [00:11<01:22, 302.35it/s]","\rparsing log, completed traces ::  21%|##        | 6498/31509 [00:12<01:09, 361.69it/s]","\rparsing log, completed traces ::  21%|##        | 6556/31509 [00:12<01:02, 400.12it/s]","\rparsing log, completed traces ::  21%|##1       | 6621/31509 [00:12<00:55, 450.82it/s]","\rparsing log, completed traces ::  21%|##1       | 6687/31509 [00:12<00:49, 498.07it/s]","\rparsing log, completed traces ::  21%|##1       | 6755/31509 [00:12<00:45, 541.72it/s]","\rparsing log, completed traces ::  22%|##1       | 6825/31509 [00:12<00:42, 582.34it/s]","\rparsing log, completed traces ::  22%|##1       | 6891/31509 [00:12<00:40, 602.35it/s]","\rparsing log, completed traces ::  22%|##2       | 6959/31509 [00:12<00:39, 620.73it/s]","\rparsing log, completed traces ::  22%|##2       | 7035/31509 [00:12<00:37, 657.99it/s]","\rparsing log, completed traces ::  23%|##2       | 7104/31509 [00:13<00:36, 666.70it/s]","\rparsing log, completed traces ::  23%|##2       | 7173/31509 [00:13<00:36, 667.95it/s]","\rparsing log, completed traces ::  23%|##2       | 7242/31509 [00:13<00:36, 667.40it/s]","\rparsing log, completed traces ::  23%|##3       | 7310/31509 [00:13<00:36, 669.84it/s]","\rparsing log, completed traces ::  23%|##3       | 7378/31509 [00:13<00:36, 656.89it/s]","\rparsing log, completed traces ::  24%|##3       | 7446/31509 [00:13<00:36, 660.71it/s]","\rparsing log, completed traces ::  24%|##3       | 7521/31509 [00:13<00:35, 685.31it/s]","\rparsing log, completed traces ::  24%|##4       | 7594/31509 [00:13<00:34, 695.90it/s]","\rparsing log, completed traces ::  24%|##4       | 7664/31509 [00:13<00:35, 671.80it/s]","\rparsing log, completed traces ::  25%|##4       | 7732/31509 [00:13<00:35, 666.17it/s]","\rparsing log, completed traces ::  25%|##4       | 7799/31509 [00:14<00:36, 653.62it/s]","\rparsing log, completed traces ::  25%|##4       | 7872/31509 [00:14<00:35, 671.64it/s]","\rparsing log, completed traces ::  25%|##5       | 7941/31509 [00:14<00:35, 672.07it/s]","\rparsing log, completed traces ::  25%|##5       | 8012/31509 [00:14<00:34, 682.72it/s]","\rparsing log, completed traces ::  26%|##5       | 8081/31509 [00:14<00:34, 682.30it/s]","\rparsing log, completed traces ::  26%|##5       | 8150/31509 [00:14<00:34, 681.27it/s]","\rparsing log, completed traces ::  26%|##6       | 8224/31509 [00:14<00:33, 696.69it/s]","\rparsing log, completed traces ::  26%|##6       | 8295/31509 [00:14<00:33, 699.56it/s]","\rparsing log, completed traces ::  27%|##6       | 8365/31509 [00:15<01:25, 271.34it/s]","\rparsing log, completed traces ::  27%|##6       | 8427/31509 [00:15<01:12, 320.38it/s]","\rparsing log, completed traces ::  27%|##6       | 8499/31509 [00:15<00:59, 386.08it/s]","\rparsing log, completed traces ::  27%|##7       | 8561/31509 [00:15<00:53, 429.88it/s]","\rparsing log, completed traces ::  27%|##7       | 8630/31509 [00:15<00:47, 485.59it/s]","\rparsing log, completed traces ::  28%|##7       | 8699/31509 [00:15<00:42, 530.84it/s]","\rparsing log, completed traces ::  28%|##7       | 8768/31509 [00:15<00:39, 569.04it/s]","\rparsing log, completed traces ::  28%|##8       | 8835/31509 [00:16<00:38, 594.87it/s]","\rparsing log, completed traces ::  28%|##8       | 8901/31509 [00:16<00:37, 606.16it/s]","\rparsing log, completed traces ::  28%|##8       | 8970/31509 [00:16<00:35, 626.89it/s]","\rparsing log, completed traces ::  29%|##8       | 9036/31509 [00:16<00:36, 622.20it/s]","\rparsing log, completed traces ::  29%|##8       | 9101/31509 [00:16<00:35, 626.33it/s]","\rparsing log, completed traces ::  29%|##9       | 9169/31509 [00:16<00:34, 638.99it/s]","\rparsing log, completed traces ::  29%|##9       | 9235/31509 [00:16<00:35, 626.22it/s]","\rparsing log, completed traces ::  30%|##9       | 9299/31509 [00:16<00:35, 624.39it/s]","\rparsing log, completed traces ::  30%|##9       | 9368/31509 [00:16<00:34, 640.68it/s]","\rparsing log, completed traces ::  30%|##9       | 9433/31509 [00:17<00:35, 628.14it/s]","\rparsing log, completed traces ::  30%|###       | 9500/31509 [00:17<00:34, 637.39it/s]","\rparsing log, completed traces ::  30%|###       | 9567/31509 [00:17<00:33, 645.74it/s]","\rparsing log, completed traces ::  31%|###       | 9635/31509 [00:17<00:33, 655.56it/s]","\rparsing log, completed traces ::  31%|###       | 9701/31509 [00:17<00:34, 636.21it/s]","\rparsing log, completed traces ::  31%|###       | 9766/31509 [00:17<00:33, 639.71it/s]","\rparsing log, completed traces ::  31%|###1      | 9831/31509 [00:17<00:33, 640.78it/s]","\rparsing log, completed traces ::  31%|###1      | 9896/31509 [00:17<00:34, 633.07it/s]","\rparsing log, completed traces ::  32%|###1      | 9962/31509 [00:17<00:33, 639.19it/s]","\rparsing log, completed traces ::  32%|###1      | 10026/31509 [00:17<00:33, 635.33it/s]","\rparsing log, completed traces ::  32%|###2      | 10090/31509 [00:18<00:34, 612.39it/s]","\rparsing log, completed traces ::  32%|###2      | 10152/31509 [00:18<00:34, 614.21it/s]","\rparsing log, completed traces ::  32%|###2      | 10220/31509 [00:18<00:33, 632.85it/s]","\rparsing log, completed traces ::  33%|###2      | 10285/31509 [00:18<00:33, 636.43it/s]","\rparsing log, completed traces ::  33%|###2      | 10349/31509 [00:18<00:34, 615.41it/s]","\rparsing log, completed traces ::  33%|###3      | 10411/31509 [00:19<01:30, 233.70it/s]","\rparsing log, completed traces ::  33%|###3      | 10472/31509 [00:19<01:13, 284.64it/s]","\rparsing log, completed traces ::  33%|###3      | 10534/31509 [00:19<01:01, 338.50it/s]","\rparsing log, completed traces ::  34%|###3      | 10601/31509 [00:19<00:52, 400.00it/s]","\rparsing log, completed traces ::  34%|###3      | 10662/31509 [00:19<00:46, 443.59it/s]","\rparsing log, completed traces ::  34%|###4      | 10722/31509 [00:19<00:43, 478.92it/s]","\rparsing log, completed traces ::  34%|###4      | 10782/31509 [00:19<00:40, 506.68it/s]","\rparsing log, completed traces ::  34%|###4      | 10841/31509 [00:19<00:39, 518.94it/s]","\rparsing log, completed traces ::  35%|###4      | 10900/31509 [00:19<00:38, 536.63it/s]","\rparsing log, completed traces ::  35%|###4      | 10961/31509 [00:20<00:37, 553.89it/s]","\rparsing log, completed traces ::  35%|###4      | 11028/31509 [00:20<00:35, 583.97it/s]","\rparsing log, completed traces ::  35%|###5      | 11094/31509 [00:20<00:33, 604.94it/s]","\rparsing log, completed traces ::  35%|###5      | 11159/31509 [00:20<00:32, 617.01it/s]","\rparsing log, completed traces ::  36%|###5      | 11225/31509 [00:20<00:32, 628.13it/s]","\rparsing log, completed traces ::  36%|###5      | 11294/31509 [00:20<00:31, 645.76it/s]","\rparsing log, completed traces ::  36%|###6      | 11360/31509 [00:20<00:31, 632.69it/s]","\rparsing log, completed traces ::  36%|###6      | 11424/31509 [00:20<00:31, 633.53it/s]","\rparsing log, completed traces ::  36%|###6      | 11489/31509 [00:20<00:31, 635.57it/s]","\rparsing log, completed traces ::  37%|###6      | 11553/31509 [00:20<00:32, 622.80it/s]","\rparsing log, completed traces ::  37%|###6      | 11619/31509 [00:21<00:31, 631.16it/s]","\rparsing log, completed traces ::  37%|###7      | 11683/31509 [00:21<00:31, 628.35it/s]","\rparsing log, completed traces ::  37%|###7      | 11750/31509 [00:21<00:30, 640.11it/s]","\rparsing log, completed traces ::  38%|###7      | 11818/31509 [00:21<00:30, 649.95it/s]","\rparsing log, completed traces ::  38%|###7      | 11887/31509 [00:21<00:29, 661.04it/s]","\rparsing log, completed traces ::  38%|###7      | 11958/31509 [00:21<00:29, 673.61it/s]","\rparsing log, completed traces ::  38%|###8      | 12026/31509 [00:21<00:29, 659.57it/s]","\rparsing log, completed traces ::  38%|###8      | 12093/31509 [00:21<00:29, 661.30it/s]","\rparsing log, completed traces ::  39%|###8      | 12160/31509 [00:21<00:29, 654.34it/s]","\rparsing log, completed traces ::  39%|###8      | 12229/31509 [00:22<00:29, 664.54it/s]","\rparsing log, completed traces ::  39%|###9      | 12296/31509 [00:22<00:29, 654.98it/s]","\rparsing log, completed traces ::  39%|###9      | 12365/31509 [00:22<00:28, 662.77it/s]","\rparsing log, completed traces ::  39%|###9      | 12432/31509 [00:22<00:28, 658.73it/s]","\rparsing log, completed traces ::  40%|###9      | 12499/31509 [00:22<00:28, 659.49it/s]","\rparsing log, completed traces ::  40%|###9      | 12565/31509 [00:22<00:29, 648.09it/s]","\rparsing log, completed traces ::  40%|####      | 12634/31509 [00:22<00:28, 659.00it/s]","\rparsing log, completed traces ::  40%|####      | 12700/31509 [00:23<01:20, 233.94it/s]","\rparsing log, completed traces ::  41%|####      | 12764/31509 [00:23<01:05, 286.68it/s]","\rparsing log, completed traces ::  41%|####      | 12829/31509 [00:23<00:54, 343.16it/s]","\rparsing log, completed traces ::  41%|####      | 12894/31509 [00:23<00:46, 398.97it/s]","\rparsing log, completed traces ::  41%|####1     | 12957/31509 [00:23<00:41, 445.87it/s]","\rparsing log, completed traces ::  41%|####1     | 13025/31509 [00:23<00:37, 499.03it/s]","\rparsing log, completed traces ::  42%|####1     | 13101/31509 [00:23<00:32, 563.00it/s]","\rparsing log, completed traces ::  42%|####1     | 13168/31509 [00:24<00:31, 578.16it/s]","\rparsing log, completed traces ::  42%|####2     | 13234/31509 [00:24<00:30, 594.03it/s]","\rparsing log, completed traces ::  42%|####2     | 13299/31509 [00:24<00:29, 607.16it/s]","\rparsing log, completed traces ::  42%|####2     | 13364/31509 [00:24<00:29, 614.29it/s]","\rparsing log, completed traces ::  43%|####2     | 13432/31509 [00:24<00:28, 632.86it/s]","\rparsing log, completed traces ::  43%|####2     | 13498/31509 [00:24<00:28, 631.68it/s]","\rparsing log, completed traces ::  43%|####3     | 13563/31509 [00:24<00:28, 629.51it/s]","\rparsing log, completed traces ::  43%|####3     | 13627/31509 [00:24<00:29, 615.19it/s]","\rparsing log, completed traces ::  43%|####3     | 13690/31509 [00:24<00:28, 617.51it/s]","\rparsing log, completed traces ::  44%|####3     | 13758/31509 [00:24<00:27, 635.48it/s]","\rparsing log, completed traces ::  44%|####3     | 13824/31509 [00:25<00:27, 636.72it/s]","\rparsing log, completed traces ::  44%|####4     | 13888/31509 [00:25<00:27, 631.47it/s]","\rparsing log, completed traces ::  44%|####4     | 13956/31509 [00:25<00:27, 645.60it/s]","\rparsing log, completed traces ::  45%|####4     | 14023/31509 [00:25<00:26, 651.72it/s]","\rparsing log, completed traces ::  45%|####4     | 14089/31509 [00:25<00:26, 652.51it/s]","\rparsing log, completed traces ::  45%|####4     | 14160/31509 [00:25<00:26, 664.33it/s]","\rparsing log, completed traces ::  45%|####5     | 14227/31509 [00:25<00:25, 665.23it/s]","\rparsing log, completed traces ::  45%|####5     | 14294/31509 [00:25<00:25, 662.86it/s]","\rparsing log, completed traces ::  46%|####5     | 14365/31509 [00:25<00:25, 675.17it/s]","\rparsing log, completed traces ::  46%|####5     | 14433/31509 [00:25<00:25, 676.01it/s]","\rparsing log, completed traces ::  46%|####6     | 14501/31509 [00:26<00:25, 673.93it/s]","\rparsing log, completed traces ::  46%|####6     | 14569/31509 [00:26<00:26, 646.62it/s]","\rparsing log, completed traces ::  46%|####6     | 14634/31509 [00:26<00:26, 647.07it/s]","\rparsing log, completed traces ::  47%|####6     | 14702/31509 [00:26<00:25, 655.65it/s]","\rparsing log, completed traces ::  47%|####6     | 14768/31509 [00:26<00:25, 651.77it/s]","\rparsing log, completed traces ::  47%|####7     | 14838/31509 [00:26<00:25, 663.89it/s]","\rparsing log, completed traces ::  47%|####7     | 14905/31509 [00:26<00:25, 657.99it/s]","\rparsing log, completed traces ::  48%|####7     | 14977/31509 [00:26<00:24, 673.06it/s]","\rparsing log, completed traces ::  48%|####7     | 15045/31509 [00:26<00:24, 673.73it/s]","\rparsing log, completed traces ::  48%|####7     | 15116/31509 [00:27<00:24, 682.29it/s]","\rparsing log, completed traces ::  48%|####8     | 15186/31509 [00:27<00:23, 685.72it/s]","\rparsing log, completed traces ::  48%|####8     | 15255/31509 [00:27<00:23, 680.02it/s]","\rparsing log, completed traces ::  49%|####8     | 15330/31509 [00:27<00:23, 698.69it/s]","\rparsing log, completed traces ::  49%|####8     | 15400/31509 [00:27<00:23, 695.34it/s]","\rparsing log, completed traces ::  49%|####9     | 15470/31509 [00:28<01:08, 232.94it/s]","\rparsing log, completed traces ::  49%|####9     | 15540/31509 [00:28<00:54, 290.73it/s]","\rparsing log, completed traces ::  50%|####9     | 15613/31509 [00:28<00:44, 356.10it/s]","\rparsing log, completed traces ::  50%|####9     | 15685/31509 [00:28<00:37, 419.81it/s]","\rparsing log, completed traces ::  50%|####9     | 15751/31509 [00:28<00:33, 467.34it/s]","\rparsing log, completed traces ::  50%|#####     | 15819/31509 [00:28<00:30, 514.66it/s]","\rparsing log, completed traces ::  50%|#####     | 15893/31509 [00:28<00:27, 568.40it/s]","\rparsing log, completed traces ::  51%|#####     | 15962/31509 [00:28<00:25, 598.51it/s]","\rparsing log, completed traces ::  51%|#####     | 16031/31509 [00:29<00:25, 613.93it/s]","\rparsing log, completed traces ::  51%|#####1    | 16104/31509 [00:29<00:23, 643.59it/s]","\rparsing log, completed traces ::  51%|#####1    | 16177/31509 [00:29<00:22, 666.80it/s]","\rparsing log, completed traces ::  52%|#####1    | 16247/31509 [00:29<00:22, 668.69it/s]","\rparsing log, completed traces ::  52%|#####1    | 16320/31509 [00:29<00:22, 680.40it/s]","\rparsing log, completed traces ::  52%|#####2    | 16390/31509 [00:29<00:23, 656.41it/s]","\rparsing log, completed traces ::  52%|#####2    | 16457/31509 [00:29<00:23, 652.93it/s]","\rparsing log, completed traces ::  52%|#####2    | 16524/31509 [00:29<00:23, 633.08it/s]","\rparsing log, completed traces ::  53%|#####2    | 16594/31509 [00:29<00:22, 651.66it/s]","\rparsing log, completed traces ::  53%|#####2    | 16666/31509 [00:29<00:22, 669.90it/s]","\rparsing log, completed traces ::  53%|#####3    | 16734/31509 [00:30<00:22, 663.24it/s]","\rparsing log, completed traces ::  53%|#####3    | 16801/31509 [00:30<00:22, 663.00it/s]","\rparsing log, completed traces ::  54%|#####3    | 16871/31509 [00:30<00:21, 673.21it/s]","\rparsing log, completed traces ::  54%|#####3    | 16939/31509 [00:30<00:21, 674.35it/s]","\rparsing log, completed traces ::  54%|#####3    | 17007/31509 [00:30<00:21, 673.91it/s]","\rparsing log, completed traces ::  54%|#####4    | 17084/31509 [00:30<00:20, 702.33it/s]","\rparsing log, completed traces ::  54%|#####4    | 17155/31509 [00:30<00:20, 691.26it/s]","\rparsing log, completed traces ::  55%|#####4    | 17225/31509 [00:30<00:21, 675.63it/s]","\rparsing log, completed traces ::  55%|#####4    | 17296/31509 [00:30<00:20, 683.66it/s]","\rparsing log, completed traces ::  55%|#####5    | 17365/31509 [00:30<00:20, 675.12it/s]","\rparsing log, completed traces ::  55%|#####5    | 17440/31509 [00:31<00:20, 694.61it/s]","\rparsing log, completed traces ::  56%|#####5    | 17510/31509 [00:31<00:21, 657.47it/s]","\rparsing log, completed traces ::  56%|#####5    | 17582/31509 [00:31<00:20, 673.15it/s]","\rparsing log, completed traces ::  56%|#####6    | 17656/31509 [00:31<00:20, 691.73it/s]","\rparsing log, completed traces ::  56%|#####6    | 17726/31509 [00:31<00:20, 687.80it/s]","\rparsing log, completed traces ::  56%|#####6    | 17796/31509 [00:31<00:20, 685.44it/s]","\rparsing log, completed traces ::  57%|#####6    | 17868/31509 [00:31<00:19, 692.37it/s]","\rparsing log, completed traces ::  57%|#####6    | 17938/31509 [00:31<00:19, 686.93it/s]","\rparsing log, completed traces ::  57%|#####7    | 18009/31509 [00:31<00:19, 693.63it/s]","\rparsing log, completed traces ::  57%|#####7    | 18082/31509 [00:32<00:19, 702.39it/s]","\rparsing log, completed traces ::  58%|#####7    | 18153/31509 [00:32<00:19, 701.78it/s]","\rparsing log, completed traces ::  58%|#####7    | 18224/31509 [00:32<00:19, 688.16it/s]","\rparsing log, completed traces ::  58%|#####8    | 18296/31509 [00:32<00:18, 697.23it/s]","\rparsing log, completed traces ::  58%|#####8    | 18366/31509 [00:32<00:19, 687.70it/s]","\rparsing log, completed traces ::  59%|#####8    | 18438/31509 [00:32<00:18, 695.36it/s]","\rparsing log, completed traces ::  59%|#####8    | 18508/31509 [00:32<00:18, 694.49it/s]","\rparsing log, completed traces ::  59%|#####8    | 18578/31509 [00:32<00:19, 671.69it/s]","\rparsing log, completed traces ::  59%|#####9    | 18646/31509 [00:33<01:02, 206.99it/s]","\rparsing log, completed traces ::  59%|#####9    | 18723/31509 [00:33<00:47, 270.11it/s]","\rparsing log, completed traces ::  60%|#####9    | 18790/31509 [00:33<00:39, 324.99it/s]","\rparsing log, completed traces ::  60%|#####9    | 18860/31509 [00:33<00:32, 386.24it/s]","\rparsing log, completed traces ::  60%|######    | 18940/31509 [00:34<00:27, 463.46it/s]","\rparsing log, completed traces ::  60%|######    | 19010/31509 [00:34<00:24, 512.34it/s]","\rparsing log, completed traces ::  61%|######    | 19081/31509 [00:34<00:22, 557.89it/s]","\rparsing log, completed traces ::  61%|######    | 19155/31509 [00:34<00:20, 602.95it/s]","\rparsing log, completed traces ::  61%|######1   | 19226/31509 [00:34<00:20, 609.91it/s]","\rparsing log, completed traces ::  61%|######1   | 19298/31509 [00:34<00:19, 637.48it/s]","\rparsing log, completed traces ::  61%|######1   | 19371/31509 [00:34<00:18, 660.21it/s]","\rparsing log, completed traces ::  62%|######1   | 19445/31509 [00:34<00:17, 681.24it/s]","\rparsing log, completed traces ::  62%|######1   | 19516/31509 [00:34<00:17, 682.93it/s]","\rparsing log, completed traces ::  62%|######2   | 19589/31509 [00:34<00:17, 693.83it/s]","\rparsing log, completed traces ::  62%|######2   | 19660/31509 [00:35<00:17, 691.12it/s]","\rparsing log, completed traces ::  63%|######2   | 19731/31509 [00:35<00:17, 686.39it/s]","\rparsing log, completed traces ::  63%|######2   | 19801/31509 [00:35<00:17, 660.85it/s]","\rparsing log, completed traces ::  63%|######3   | 19869/31509 [00:35<00:17, 665.22it/s]","\rparsing log, completed traces ::  63%|######3   | 19937/31509 [00:35<00:17, 665.57it/s]","\rparsing log, completed traces ::  63%|######3   | 20004/31509 [00:35<00:17, 660.61it/s]","\rparsing log, completed traces ::  64%|######3   | 20073/31509 [00:35<00:17, 666.74it/s]","\rparsing log, completed traces ::  64%|######3   | 20141/31509 [00:35<00:16, 668.79it/s]","\rparsing log, completed traces ::  64%|######4   | 20213/31509 [00:35<00:16, 681.77it/s]","\rparsing log, completed traces ::  64%|######4   | 20287/31509 [00:35<00:16, 698.33it/s]","\rparsing log, completed traces ::  65%|######4   | 20357/31509 [00:36<00:16, 686.10it/s]","\rparsing log, completed traces ::  65%|######4   | 20434/31509 [00:36<00:15, 710.39it/s]","\rparsing log, completed traces ::  65%|######5   | 20506/31509 [00:36<00:15, 707.12it/s]","\rparsing log, completed traces ::  65%|######5   | 20578/31509 [00:36<00:15, 710.68it/s]","\rparsing log, completed traces ::  66%|######5   | 20656/31509 [00:36<00:14, 728.56it/s]","\rparsing log, completed traces ::  66%|######5   | 20730/31509 [00:36<00:14, 730.86it/s]","\rparsing log, completed traces ::  66%|######6   | 20804/31509 [00:36<00:14, 726.83it/s]","\rparsing log, completed traces ::  66%|######6   | 20877/31509 [00:36<00:14, 717.31it/s]","\rparsing log, completed traces ::  66%|######6   | 20949/31509 [00:36<00:15, 697.31it/s]","\rparsing log, completed traces ::  67%|######6   | 21019/31509 [00:37<00:15, 691.72it/s]","\rparsing log, completed traces ::  67%|######6   | 21089/31509 [00:37<00:15, 679.93it/s]","\rparsing log, completed traces ::  67%|######7   | 21158/31509 [00:37<00:15, 671.71it/s]","\rparsing log, completed traces ::  67%|######7   | 21232/31509 [00:37<00:14, 690.30it/s]","\rparsing log, completed traces ::  68%|######7   | 21302/31509 [00:37<00:14, 692.94it/s]","\rparsing log, completed traces ::  68%|######7   | 21372/31509 [00:37<00:14, 689.61it/s]","\rparsing log, completed traces ::  68%|######8   | 21447/31509 [00:37<00:14, 706.15it/s]","\rparsing log, completed traces ::  68%|######8   | 21522/31509 [00:37<00:13, 718.73it/s]","\rparsing log, completed traces ::  69%|######8   | 21595/31509 [00:37<00:13, 721.00it/s]","\rparsing log, completed traces ::  69%|######8   | 21668/31509 [00:37<00:14, 696.40it/s]","\rparsing log, completed traces ::  69%|######9   | 21748/31509 [00:38<00:13, 724.55it/s]","\rparsing log, completed traces ::  69%|######9   | 21821/31509 [00:38<00:13, 719.26it/s]","\rparsing log, completed traces ::  69%|######9   | 21898/31509 [00:38<00:13, 734.04it/s]","\rparsing log, completed traces ::  70%|######9   | 21972/31509 [00:38<00:13, 722.95it/s]","\rparsing log, completed traces ::  70%|######9   | 22050/31509 [00:38<00:12, 737.82it/s]","\rparsing log, completed traces ::  70%|#######   | 22124/31509 [00:38<00:12, 728.26it/s]","\rparsing log, completed traces ::  70%|#######   | 22199/31509 [00:38<00:12, 730.24it/s]","\rparsing log, completed traces ::  71%|#######   | 22273/31509 [00:39<00:45, 203.72it/s]","\rparsing log, completed traces ::  71%|#######   | 22346/31509 [00:39<00:35, 258.00it/s]","\rparsing log, completed traces ::  71%|#######1  | 22422/31509 [00:39<00:28, 323.03it/s]","\rparsing log, completed traces ::  71%|#######1  | 22497/31509 [00:39<00:23, 389.14it/s]","\rparsing log, completed traces ::  72%|#######1  | 22566/31509 [00:40<00:20, 443.11it/s]","\rparsing log, completed traces ::  72%|#######1  | 22638/31509 [00:40<00:17, 499.88it/s]","\rparsing log, completed traces ::  72%|#######2  | 22710/31509 [00:40<00:16, 549.68it/s]","\rparsing log, completed traces ::  72%|#######2  | 22784/31509 [00:40<00:14, 594.33it/s]","\rparsing log, completed traces ::  73%|#######2  | 22856/31509 [00:40<00:13, 626.20it/s]","\rparsing log, completed traces ::  73%|#######2  | 22927/31509 [00:40<00:13, 633.89it/s]","\rparsing log, completed traces ::  73%|#######2  | 22997/31509 [00:40<00:13, 649.83it/s]","\rparsing log, completed traces ::  73%|#######3  | 23067/31509 [00:40<00:12, 659.02it/s]","\rparsing log, completed traces ::  73%|#######3  | 23136/31509 [00:40<00:12, 666.86it/s]","\rparsing log, completed traces ::  74%|#######3  | 23205/31509 [00:40<00:12, 666.18it/s]","\rparsing log, completed traces ::  74%|#######3  | 23274/31509 [00:41<00:12, 665.97it/s]","\rparsing log, completed traces ::  74%|#######4  | 23342/31509 [00:41<00:12, 668.91it/s]","\rparsing log, completed traces ::  74%|#######4  | 23410/31509 [00:41<00:12, 663.86it/s]","\rparsing log, completed traces ::  75%|#######4  | 23478/31509 [00:41<00:12, 666.07it/s]","\rparsing log, completed traces ::  75%|#######4  | 23550/31509 [00:41<00:11, 680.50it/s]","\rparsing log, completed traces ::  75%|#######4  | 23621/31509 [00:41<00:11, 686.29it/s]","\rparsing log, completed traces ::  75%|#######5  | 23692/31509 [00:41<00:11, 693.06it/s]","\rparsing log, completed traces ::  75%|#######5  | 23765/31509 [00:41<00:11, 700.45it/s]","\rparsing log, completed traces ::  76%|#######5  | 23836/31509 [00:41<00:11, 690.84it/s]","\rparsing log, completed traces ::  76%|#######5  | 23907/31509 [00:42<00:10, 696.44it/s]","\rparsing log, completed traces ::  76%|#######6  | 23977/31509 [00:42<00:10, 688.51it/s]","\rparsing log, completed traces ::  76%|#######6  | 24046/31509 [00:42<00:10, 683.51it/s]","\rparsing log, completed traces ::  77%|#######6  | 24116/31509 [00:42<00:10, 686.50it/s]","\rparsing log, completed traces ::  77%|#######6  | 24185/31509 [00:42<00:10, 686.12it/s]","\rparsing log, completed traces ::  77%|#######6  | 24254/31509 [00:42<00:10, 687.16it/s]","\rparsing log, completed traces ::  77%|#######7  | 24326/31509 [00:42<00:10, 695.90it/s]","\rparsing log, completed traces ::  77%|#######7  | 24397/31509 [00:42<00:10, 700.05it/s]","\rparsing log, completed traces ::  78%|#######7  | 24468/31509 [00:42<00:10, 695.81it/s]","\rparsing log, completed traces ::  78%|#######7  | 24538/31509 [00:42<00:10, 691.52it/s]","\rparsing log, completed traces ::  78%|#######8  | 24615/31509 [00:43<00:09, 713.61it/s]","\rparsing log, completed traces ::  78%|#######8  | 24687/31509 [00:43<00:09, 705.71it/s]","\rparsing log, completed traces ::  79%|#######8  | 24760/31509 [00:43<00:09, 710.52it/s]","\rparsing log, completed traces ::  79%|#######8  | 24834/31509 [00:43<00:09, 715.93it/s]","\rparsing log, completed traces ::  79%|#######9  | 24906/31509 [00:43<00:09, 713.64it/s]","\rparsing log, completed traces ::  79%|#######9  | 24982/31509 [00:43<00:08, 727.33it/s]","\rparsing log, completed traces ::  80%|#######9  | 25055/31509 [00:43<00:09, 713.21it/s]","\rparsing log, completed traces ::  80%|#######9  | 25127/31509 [00:43<00:09, 698.29it/s]","\rparsing log, completed traces ::  80%|#######9  | 25201/31509 [00:43<00:08, 709.56it/s]","\rparsing log, completed traces ::  80%|########  | 25273/31509 [00:43<00:09, 691.96it/s]","\rparsing log, completed traces ::  80%|########  | 25343/31509 [00:44<00:09, 663.45it/s]","\rparsing log, completed traces ::  81%|########  | 25423/31509 [00:44<00:08, 698.20it/s]","\rparsing log, completed traces ::  81%|########  | 25494/31509 [00:44<00:08, 693.09it/s]","\rparsing log, completed traces ::  81%|########1 | 25566/31509 [00:44<00:08, 699.07it/s]","\rparsing log, completed traces ::  81%|########1 | 25637/31509 [00:44<00:08, 686.44it/s]","\rparsing log, completed traces ::  82%|########1 | 25707/31509 [00:44<00:08, 688.47it/s]","\rparsing log, completed traces ::  82%|########1 | 25777/31509 [00:44<00:08, 690.66it/s]","\rparsing log, completed traces ::  82%|########2 | 25847/31509 [00:44<00:08, 679.30it/s]","\rparsing log, completed traces ::  82%|########2 | 25916/31509 [00:44<00:08, 680.66it/s]","\rparsing log, completed traces ::  82%|########2 | 25985/31509 [00:44<00:08, 682.09it/s]","\rparsing log, completed traces ::  83%|########2 | 26054/31509 [00:45<00:08, 672.64it/s]","\rparsing log, completed traces ::  83%|########2 | 26122/31509 [00:45<00:08, 669.04it/s]","\rparsing log, completed traces ::  83%|########3 | 26194/31509 [00:45<00:07, 681.13it/s]","\rparsing log, completed traces ::  83%|########3 | 26263/31509 [00:45<00:07, 680.94it/s]","\rparsing log, completed traces ::  84%|########3 | 26332/31509 [00:46<00:29, 176.13it/s]","\rparsing log, completed traces ::  84%|########3 | 26404/31509 [00:46<00:22, 229.08it/s]","\rparsing log, completed traces ::  84%|########4 | 26472/31509 [00:46<00:17, 283.85it/s]","\rparsing log, completed traces ::  84%|########4 | 26535/31509 [00:46<00:14, 334.48it/s]","\rparsing log, completed traces ::  84%|########4 | 26601/31509 [00:46<00:12, 389.85it/s]","\rparsing log, completed traces ::  85%|########4 | 26670/31509 [00:46<00:10, 449.26it/s]","\rparsing log, completed traces ::  85%|########4 | 26743/31509 [00:47<00:09, 510.67it/s]","\rparsing log, completed traces ::  85%|########5 | 26810/31509 [00:47<00:08, 544.93it/s]","\rparsing log, completed traces ::  85%|########5 | 26876/31509 [00:47<00:08, 570.60it/s]","\rparsing log, completed traces ::  86%|########5 | 26946/31509 [00:47<00:07, 604.02it/s]","\rparsing log, completed traces ::  86%|########5 | 27013/31509 [00:47<00:07, 612.20it/s]","\rparsing log, completed traces ::  86%|########5 | 27080/31509 [00:47<00:07, 624.87it/s]","\rparsing log, completed traces ::  86%|########6 | 27152/31509 [00:47<00:06, 650.79it/s]","\rparsing log, completed traces ::  86%|########6 | 27222/31509 [00:47<00:06, 664.75it/s]","\rparsing log, completed traces ::  87%|########6 | 27293/31509 [00:47<00:06, 677.12it/s]","\rparsing log, completed traces ::  87%|########6 | 27362/31509 [00:48<00:06, 665.52it/s]","\rparsing log, completed traces ::  87%|########7 | 27431/31509 [00:48<00:06, 670.22it/s]","\rparsing log, completed traces ::  87%|########7 | 27499/31509 [00:48<00:05, 670.81it/s]","\rparsing log, completed traces ::  87%|########7 | 27570/31509 [00:48<00:05, 681.86it/s]","\rparsing log, completed traces ::  88%|########7 | 27641/31509 [00:48<00:05, 689.35it/s]","\rparsing log, completed traces ::  88%|########7 | 27714/31509 [00:48<00:05, 699.90it/s]","\rparsing log, completed traces ::  88%|########8 | 27788/31509 [00:48<00:05, 709.39it/s]","\rparsing log, completed traces ::  88%|########8 | 27860/31509 [00:48<00:05, 692.32it/s]","\rparsing log, completed traces ::  89%|########8 | 27930/31509 [00:48<00:05, 685.82it/s]","\rparsing log, completed traces ::  89%|########8 | 27999/31509 [00:48<00:05, 684.85it/s]","\rparsing log, completed traces ::  89%|########9 | 28068/31509 [00:49<00:05, 680.64it/s]","\rparsing log, completed traces ::  89%|########9 | 28137/31509 [00:49<00:05, 669.63it/s]","\rparsing log, completed traces ::  90%|########9 | 28205/31509 [00:49<00:04, 670.38it/s]","\rparsing log, completed traces ::  90%|########9 | 28279/31509 [00:49<00:04, 687.32it/s]","\rparsing log, completed traces ::  90%|########9 | 28348/31509 [00:49<00:04, 677.19it/s]","\rparsing log, completed traces ::  90%|######### | 28416/31509 [00:49<00:04, 672.59it/s]","\rparsing log, completed traces ::  90%|######### | 28486/31509 [00:49<00:04, 680.41it/s]","\rparsing log, completed traces ::  91%|######### | 28555/31509 [00:49<00:04, 681.67it/s]","\rparsing log, completed traces ::  91%|######### | 28626/31509 [00:49<00:04, 689.80it/s]","\rparsing log, completed traces ::  91%|#########1| 28696/31509 [00:49<00:04, 676.41it/s]","\rparsing log, completed traces ::  91%|#########1| 28764/31509 [00:50<00:04, 646.40it/s]","\rparsing log, completed traces ::  91%|#########1| 28829/31509 [00:50<00:04, 631.95it/s]","\rparsing log, completed traces ::  92%|#########1| 28893/31509 [00:50<00:04, 626.13it/s]","\rparsing log, completed traces ::  92%|#########1| 28963/31509 [00:50<00:03, 647.07it/s]","\rparsing log, completed traces ::  92%|#########2| 29032/31509 [00:50<00:03, 657.73it/s]","\rparsing log, completed traces ::  92%|#########2| 29098/31509 [00:50<00:03, 653.14it/s]","\rparsing log, completed traces ::  93%|#########2| 29166/31509 [00:50<00:03, 660.30it/s]","\rparsing log, completed traces ::  93%|#########2| 29238/31509 [00:50<00:03, 677.30it/s]","\rparsing log, completed traces ::  93%|#########3| 29306/31509 [00:50<00:03, 671.63it/s]","\rparsing log, completed traces ::  93%|#########3| 29374/31509 [00:51<00:03, 665.94it/s]","\rparsing log, completed traces ::  93%|#########3| 29441/31509 [00:51<00:03, 650.40it/s]","\rparsing log, completed traces ::  94%|#########3| 29507/31509 [00:51<00:03, 633.91it/s]","\rparsing log, completed traces ::  94%|#########3| 29571/31509 [00:51<00:03, 629.06it/s]","\rparsing log, completed traces ::  94%|#########4| 29644/31509 [00:51<00:02, 656.80it/s]","\rparsing log, completed traces ::  94%|#########4| 29716/31509 [00:51<00:02, 673.91it/s]","\rparsing log, completed traces ::  95%|#########4| 29784/31509 [00:51<00:02, 657.54it/s]","\rparsing log, completed traces ::  95%|#########4| 29850/31509 [00:51<00:02, 654.73it/s]","\rparsing log, completed traces ::  95%|#########4| 29919/31509 [00:51<00:02, 663.56it/s]","\rparsing log, completed traces ::  95%|#########5| 29989/31509 [00:51<00:02, 673.04it/s]","\rparsing log, completed traces ::  95%|#########5| 30057/31509 [00:52<00:02, 659.25it/s]","\rparsing log, completed traces ::  96%|#########5| 30130/31509 [00:52<00:02, 678.37it/s]","\rparsing log, completed traces ::  96%|#########5| 30198/31509 [00:52<00:01, 677.55it/s]","\rparsing log, completed traces ::  96%|#########6| 30267/31509 [00:52<00:01, 678.37it/s]","\rparsing log, completed traces ::  96%|#########6| 30338/31509 [00:52<00:01, 685.51it/s]","\rparsing log, completed traces ::  97%|#########6| 30411/31509 [00:52<00:01, 692.90it/s]","\rparsing log, completed traces ::  97%|#########6| 30481/31509 [00:52<00:01, 693.91it/s]","\rparsing log, completed traces ::  97%|#########6| 30551/31509 [00:52<00:01, 689.03it/s]","\rparsing log, completed traces ::  97%|#########7| 30624/31509 [00:52<00:01, 698.09it/s]","\rparsing log, completed traces ::  97%|#########7| 30694/31509 [00:54<00:04, 165.77it/s]","\rparsing log, completed traces ::  98%|#########7| 30762/31509 [00:54<00:03, 212.54it/s]","\rparsing log, completed traces ::  98%|#########7| 30835/31509 [00:54<00:02, 271.89it/s]","\rparsing log, completed traces ::  98%|#########8| 30902/31509 [00:54<00:01, 327.23it/s]","\rparsing log, completed traces ::  98%|#########8| 30974/31509 [00:54<00:01, 392.68it/s]","\rparsing log, completed traces ::  99%|#########8| 31042/31509 [00:54<00:01, 447.99it/s]","\rparsing log, completed traces ::  99%|#########8| 31119/31509 [00:54<00:00, 515.50it/s]","\rparsing log, completed traces ::  99%|#########8| 31191/31509 [00:54<00:00, 562.82it/s]","\rparsing log, completed traces ::  99%|#########9| 31261/31509 [00:54<00:00, 584.36it/s]","\rparsing log, completed traces ::  99%|#########9| 31330/31509 [00:54<00:00, 587.44it/s]","\rparsing log, completed traces :: 100%|#########9| 31397/31509 [00:55<00:00, 608.16it/s]","\rparsing log, completed traces :: 100%|#########9| 31466/31509 [00:55<00:00, 628.91it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:55<00:00, 570.32it/s]","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   1%|          | 761/150370 [00:00<00:19, 7609.70it/s]","\rparsing log, completed traces ::   1%|1         | 1582/150370 [00:00<00:18, 7960.63it/s]","\rparsing log, completed traces ::   2%|1         | 2379/150370 [00:00<00:40, 3645.86it/s]","\rparsing log, completed traces ::   2%|2         | 3178/150370 [00:00<00:31, 4644.36it/s]","\rparsing log, completed traces ::   3%|2         | 3982/150370 [00:00<00:26, 5483.27it/s]","\rparsing log, completed traces ::   3%|3         | 4757/150370 [00:00<00:23, 6074.00it/s]","\rparsing log, completed traces ::   4%|3         | 5564/150370 [00:00<00:21, 6614.36it/s]","\rparsing log, completed traces ::   4%|4         | 6368/150370 [00:01<00:20, 7010.43it/s]","\rparsing log, completed traces ::   5%|4         | 7166/150370 [00:01<00:19, 7286.62it/s]","\rparsing log, completed traces ::   5%|5         | 7992/150370 [00:01<00:18, 7568.26it/s]","\rparsing log, completed traces ::   6%|5         | 8847/150370 [00:01<00:18, 7854.72it/s]","\rparsing log, completed traces ::   6%|6         | 9687/150370 [00:01<00:17, 8013.35it/s]","\rparsing log, completed traces ::   7%|6         | 10509/150370 [00:01<00:17, 8074.01it/s]","\rparsing log, completed traces ::   8%|7         | 11330/150370 [00:01<00:17, 8084.66it/s]","\rparsing log, completed traces ::   8%|8         | 12148/150370 [00:01<00:17, 8112.36it/s]","\rparsing log, completed traces ::   9%|8         | 12966/150370 [00:01<00:17, 8059.16it/s]","\rparsing log, completed traces ::   9%|9         | 13777/150370 [00:01<00:16, 8036.85it/s]","\rparsing log, completed traces ::  10%|9         | 14584/150370 [00:02<00:32, 4118.34it/s]","\rparsing log, completed traces ::  10%|#         | 15401/150370 [00:02<00:27, 4840.46it/s]","\rparsing log, completed traces ::  11%|#         | 16256/150370 [00:02<00:23, 5592.56it/s]","\rparsing log, completed traces ::  11%|#1        | 17124/150370 [00:02<00:21, 6286.32it/s]","\rparsing log, completed traces ::  12%|#1        | 17974/150370 [00:02<00:19, 6823.09it/s]","\rparsing log, completed traces ::  13%|#2        | 18802/150370 [00:02<00:18, 7197.98it/s]","\rparsing log, completed traces ::  13%|#3        | 19624/150370 [00:02<00:17, 7471.63it/s]","\rparsing log, completed traces ::  14%|#3        | 20440/150370 [00:03<00:16, 7660.30it/s]","\rparsing log, completed traces ::  14%|#4        | 21296/150370 [00:03<00:16, 7915.15it/s]","\rparsing log, completed traces ::  15%|#4        | 22176/150370 [00:03<00:15, 8169.53it/s]","\rparsing log, completed traces ::  15%|#5        | 23067/150370 [00:03<00:15, 8364.96it/s]","\rparsing log, completed traces ::  16%|#5        | 23922/150370 [00:03<00:15, 8248.24it/s]","\rparsing log, completed traces ::  16%|#6        | 24760/150370 [00:03<00:16, 7683.49it/s]","\rparsing log, completed traces ::  17%|#6        | 25545/150370 [00:03<00:16, 7421.85it/s]","\rparsing log, completed traces ::  17%|#7        | 26299/150370 [00:03<00:17, 7194.65it/s]","\rparsing log, completed traces ::  18%|#7        | 27027/150370 [00:03<00:17, 6993.78it/s]","\rparsing log, completed traces ::  18%|#8        | 27733/150370 [00:04<00:35, 3413.66it/s]","\rparsing log, completed traces ::  19%|#8        | 28471/150370 [00:04<00:30, 4052.56it/s]","\rparsing log, completed traces ::  19%|#9        | 29271/150370 [00:04<00:25, 4790.90it/s]","\rparsing log, completed traces ::  20%|#9        | 30022/150370 [00:04<00:22, 5355.09it/s]","\rparsing log, completed traces ::  20%|##        | 30713/150370 [00:04<00:20, 5714.04it/s]","\rparsing log, completed traces ::  21%|##        | 31400/150370 [00:04<00:19, 5974.51it/s]","\rparsing log, completed traces ::  21%|##1       | 32089/150370 [00:05<00:19, 6202.49it/s]","\rparsing log, completed traces ::  22%|##1       | 32779/150370 [00:05<00:18, 6374.13it/s]","\rparsing log, completed traces ::  22%|##2       | 33483/150370 [00:05<00:17, 6559.19it/s]","\rparsing log, completed traces ::  23%|##2       | 34193/150370 [00:05<00:17, 6713.02it/s]","\rparsing log, completed traces ::  23%|##3       | 34889/150370 [00:05<00:17, 6732.86it/s]","\rparsing log, completed traces ::  24%|##3       | 35580/150370 [00:05<00:16, 6778.05it/s]","\rparsing log, completed traces ::  24%|##4       | 36272/150370 [00:05<00:16, 6819.05it/s]","\rparsing log, completed traces ::  25%|##4       | 36979/150370 [00:05<00:16, 6891.19it/s]","\rparsing log, completed traces ::  25%|##5       | 37680/150370 [00:05<00:16, 6925.63it/s]","\rparsing log, completed traces ::  26%|##5       | 38414/150370 [00:05<00:15, 7048.09it/s]","\rparsing log, completed traces ::  26%|##6       | 39153/150370 [00:06<00:15, 7149.64it/s]","\rparsing log, completed traces ::  27%|##6       | 39894/150370 [00:06<00:15, 7226.95it/s]","\rparsing log, completed traces ::  27%|##7       | 40636/150370 [00:06<00:15, 7284.48it/s]","\rparsing log, completed traces ::  28%|##7       | 41366/150370 [00:06<00:34, 3204.72it/s]","\rparsing log, completed traces ::  28%|##8       | 42124/150370 [00:06<00:27, 3890.83it/s]","\rparsing log, completed traces ::  29%|##8       | 42872/150370 [00:06<00:23, 4551.81it/s]","\rparsing log, completed traces ::  29%|##9       | 43644/150370 [00:07<00:20, 5211.28it/s]","\rparsing log, completed traces ::  30%|##9       | 44397/150370 [00:07<00:18, 5742.45it/s]","\rparsing log, completed traces ::  30%|###       | 45123/150370 [00:07<00:17, 6116.56it/s]","\rparsing log, completed traces ::  30%|###       | 45855/150370 [00:07<00:16, 6429.04it/s]","\rparsing log, completed traces ::  31%|###       | 46576/150370 [00:07<00:15, 6639.63it/s]","\rparsing log, completed traces ::  31%|###1      | 47296/150370 [00:07<00:15, 6758.56it/s]","\rparsing log, completed traces ::  32%|###1      | 48050/150370 [00:07<00:14, 6960.43it/s]","\rparsing log, completed traces ::  33%|###2      | 48902/150370 [00:07<00:13, 7409.04it/s]","\rparsing log, completed traces ::  33%|###3      | 49689/150370 [00:07<00:13, 7541.60it/s]","\rparsing log, completed traces ::  34%|###3      | 50459/150370 [00:07<00:13, 7527.15it/s]","\rparsing log, completed traces ::  34%|###4      | 51223/150370 [00:08<00:13, 7524.15it/s]","\rparsing log, completed traces ::  35%|###4      | 51984/150370 [00:08<00:13, 7519.58it/s]","\rparsing log, completed traces ::  35%|###5      | 52746/150370 [00:08<00:12, 7548.26it/s]","\rparsing log, completed traces ::  36%|###5      | 53505/150370 [00:08<00:12, 7488.97it/s]","\rparsing log, completed traces ::  36%|###6      | 54305/150370 [00:08<00:12, 7639.73it/s]","\rparsing log, completed traces ::  37%|###6      | 55111/150370 [00:08<00:12, 7763.89it/s]","\rparsing log, completed traces ::  37%|###7      | 55889/150370 [00:08<00:12, 7743.08it/s]","\rparsing log, completed traces ::  38%|###7      | 56708/150370 [00:08<00:11, 7855.22it/s]","\rparsing log, completed traces ::  38%|###8      | 57506/150370 [00:08<00:11, 7891.47it/s]","\rparsing log, completed traces ::  39%|###8      | 58296/150370 [00:09<00:28, 3184.78it/s]","\rparsing log, completed traces ::  39%|###9      | 59029/150370 [00:09<00:24, 3792.76it/s]","\rparsing log, completed traces ::  40%|###9      | 59832/150370 [00:09<00:20, 4526.64it/s]","\rparsing log, completed traces ::  40%|####      | 60596/150370 [00:09<00:17, 5144.23it/s]","\rparsing log, completed traces ::  41%|####      | 61465/150370 [00:09<00:15, 5924.14it/s]","\rparsing log, completed traces ::  41%|####1     | 62337/150370 [00:09<00:13, 6594.30it/s]","\rparsing log, completed traces ::  42%|####1     | 63137/150370 [00:10<00:12, 6934.82it/s]","\rparsing log, completed traces ::  43%|####2     | 63929/150370 [00:10<00:12, 7190.71it/s]","\rparsing log, completed traces ::  43%|####3     | 64732/150370 [00:10<00:11, 7405.12it/s]","\rparsing log, completed traces ::  44%|####3     | 65547/150370 [00:10<00:11, 7615.13it/s]","\rparsing log, completed traces ::  44%|####4     | 66379/150370 [00:10<00:10, 7813.06it/s]","\rparsing log, completed traces ::  45%|####4     | 67202/150370 [00:10<00:10, 7933.13it/s]","\rparsing log, completed traces ::  45%|####5     | 68096/150370 [00:10<00:10, 8206.03it/s]","\rparsing log, completed traces ::  46%|####5     | 68943/150370 [00:10<00:09, 8282.51it/s]","\rparsing log, completed traces ::  46%|####6     | 69782/150370 [00:10<00:09, 8180.38it/s]","\rparsing log, completed traces ::  47%|####6     | 70608/150370 [00:11<00:09, 8134.41it/s]","\rparsing log, completed traces ::  48%|####7     | 71427/150370 [00:11<00:09, 8065.98it/s]","\rparsing log, completed traces ::  48%|####8     | 72238/150370 [00:11<00:09, 8035.81it/s]","\rparsing log, completed traces ::  49%|####8     | 73045/150370 [00:11<00:09, 7892.33it/s]","\rparsing log, completed traces ::  49%|####9     | 73837/150370 [00:11<00:09, 7729.27it/s]","\rparsing log, completed traces ::  50%|####9     | 74757/150370 [00:11<00:09, 8155.44it/s]","\rparsing log, completed traces ::  50%|#####     | 75576/150370 [00:11<00:09, 8053.83it/s]","\rparsing log, completed traces ::  51%|#####     | 76414/150370 [00:11<00:09, 8148.70it/s]","\rparsing log, completed traces ::  51%|#####1    | 77231/150370 [00:11<00:09, 8108.27it/s]","\rparsing log, completed traces ::  52%|#####1    | 78043/150370 [00:11<00:09, 7996.63it/s]","\rparsing log, completed traces ::  52%|#####2    | 78844/150370 [00:12<00:23, 3055.80it/s]","\rparsing log, completed traces ::  53%|#####2    | 79629/150370 [00:12<00:19, 3717.18it/s]","\rparsing log, completed traces ::  53%|#####3    | 80414/150370 [00:12<00:15, 4397.58it/s]","\rparsing log, completed traces ::  54%|#####3    | 81171/150370 [00:12<00:13, 5001.47it/s]","\rparsing log, completed traces ::  55%|#####4    | 81956/150370 [00:12<00:12, 5610.29it/s]","\rparsing log, completed traces ::  55%|#####5    | 82829/150370 [00:13<00:10, 6340.11it/s]","\rparsing log, completed traces ::  56%|#####5    | 83638/150370 [00:13<00:09, 6762.27it/s]","\rparsing log, completed traces ::  56%|#####6    | 84429/150370 [00:13<00:09, 7061.08it/s]","\rparsing log, completed traces ::  57%|#####6    | 85222/150370 [00:13<00:08, 7284.19it/s]","\rparsing log, completed traces ::  57%|#####7    | 86008/150370 [00:13<00:08, 7435.62it/s]","\rparsing log, completed traces ::  58%|#####7    | 86804/150370 [00:13<00:08, 7584.39it/s]","\rparsing log, completed traces ::  58%|#####8    | 87618/150370 [00:13<00:08, 7745.32it/s]","\rparsing log, completed traces ::  59%|#####8    | 88431/150370 [00:13<00:07, 7857.61it/s]","\rparsing log, completed traces ::  59%|#####9    | 89232/150370 [00:13<00:07, 7888.40it/s]","\rparsing log, completed traces ::  60%|#####9    | 90056/150370 [00:13<00:07, 7992.21it/s]","\rparsing log, completed traces ::  60%|######    | 90878/150370 [00:14<00:07, 8037.46it/s]","\rparsing log, completed traces ::  61%|######    | 91688/150370 [00:14<00:07, 8047.68it/s]","\rparsing log, completed traces ::  62%|######1   | 92497/150370 [00:14<00:07, 8035.17it/s]","\rparsing log, completed traces ::  62%|######2   | 93304/150370 [00:14<00:07, 8040.99it/s]","\rparsing log, completed traces ::  63%|######2   | 94116/150370 [00:14<00:06, 8063.87it/s]","\rparsing log, completed traces ::  63%|######3   | 94965/150370 [00:14<00:06, 8170.52it/s]","\rparsing log, completed traces ::  64%|######3   | 95791/150370 [00:14<00:06, 8197.16it/s]","\rparsing log, completed traces ::  64%|######4   | 96612/150370 [00:14<00:06, 8116.11it/s]","\rparsing log, completed traces ::  65%|######4   | 97425/150370 [00:14<00:06, 8055.02it/s]","\rparsing log, completed traces ::  65%|######5   | 98231/150370 [00:14<00:06, 8047.43it/s]","\rparsing log, completed traces ::  66%|######5   | 99044/150370 [00:15<00:06, 8069.70it/s]","\rparsing log, completed traces ::  66%|######6   | 99852/150370 [00:15<00:06, 7999.28it/s]","\rparsing log, completed traces ::  67%|######6   | 100661/150370 [00:15<00:06, 8024.91it/s]","\rparsing log, completed traces ::  67%|######7   | 101465/150370 [00:15<00:06, 8015.27it/s]","\rparsing log, completed traces ::  68%|######8   | 102274/150370 [00:15<00:05, 8036.39it/s]","\rparsing log, completed traces ::  69%|######8   | 103078/150370 [00:16<00:16, 2793.99it/s]","\rparsing log, completed traces ::  69%|######9   | 103864/150370 [00:16<00:13, 3448.02it/s]","\rparsing log, completed traces ::  70%|######9   | 104642/150370 [00:16<00:11, 4113.97it/s]","\rparsing log, completed traces ::  70%|#######   | 105417/150370 [00:16<00:09, 4774.16it/s]","\rparsing log, completed traces ::  71%|#######   | 106194/150370 [00:16<00:08, 5390.65it/s]","\rparsing log, completed traces ::  71%|#######1  | 106960/150370 [00:16<00:07, 5895.50it/s]","\rparsing log, completed traces ::  72%|#######1  | 107735/150370 [00:16<00:06, 6348.94it/s]","\rparsing log, completed traces ::  72%|#######2  | 108499/150370 [00:16<00:06, 6683.04it/s]","\rparsing log, completed traces ::  73%|#######2  | 109271/150370 [00:17<00:05, 6962.80it/s]","\rparsing log, completed traces ::  73%|#######3  | 110047/150370 [00:17<00:05, 7182.93it/s]","\rparsing log, completed traces ::  74%|#######3  | 110821/150370 [00:17<00:05, 7319.29it/s]","\rparsing log, completed traces ::  74%|#######4  | 111606/150370 [00:17<00:05, 7471.50it/s]","\rparsing log, completed traces ::  75%|#######4  | 112377/150370 [00:17<00:05, 7534.27it/s]","\rparsing log, completed traces ::  75%|#######5  | 113148/150370 [00:17<00:04, 7541.41it/s]","\rparsing log, completed traces ::  76%|#######5  | 114015/150370 [00:17<00:04, 7858.82it/s]","\rparsing log, completed traces ::  76%|#######6  | 114993/150370 [00:17<00:04, 8404.15it/s]","\rparsing log, completed traces ::  77%|#######7  | 115948/150370 [00:17<00:03, 8742.80it/s]","\rparsing log, completed traces ::  78%|#######7  | 116947/150370 [00:17<00:03, 9113.31it/s]","\rparsing log, completed traces ::  78%|#######8  | 117863/150370 [00:18<00:03, 8973.64it/s]","\rparsing log, completed traces ::  79%|#######8  | 118764/150370 [00:18<00:03, 8390.90it/s]","\rparsing log, completed traces ::  80%|#######9  | 119613/150370 [00:18<00:03, 8016.59it/s]","\rparsing log, completed traces ::  80%|########  | 120424/150370 [00:18<00:03, 7805.91it/s]","\rparsing log, completed traces ::  81%|########  | 121211/150370 [00:18<00:03, 7632.61it/s]","\rparsing log, completed traces ::  81%|########1 | 121979/150370 [00:18<00:03, 7525.72it/s]","\rparsing log, completed traces ::  82%|########1 | 122734/150370 [00:18<00:03, 7489.99it/s]","\rparsing log, completed traces ::  82%|########2 | 123485/150370 [00:18<00:03, 7451.34it/s]","\rparsing log, completed traces ::  83%|########2 | 124232/150370 [00:18<00:03, 7287.81it/s]","\rparsing log, completed traces ::  83%|########3 | 124962/150370 [00:19<00:03, 7249.13it/s]","\rparsing log, completed traces ::  84%|########3 | 125704/150370 [00:19<00:03, 7297.88it/s]","\rparsing log, completed traces ::  84%|########4 | 126440/150370 [00:19<00:03, 7315.48it/s]","\rparsing log, completed traces ::  85%|########4 | 127190/150370 [00:19<00:03, 7368.37it/s]","\rparsing log, completed traces ::  85%|########5 | 127928/150370 [00:19<00:03, 7352.74it/s]","\rparsing log, completed traces ::  86%|########5 | 128685/150370 [00:19<00:02, 7416.90it/s]","\rparsing log, completed traces ::  86%|########6 | 129432/150370 [00:20<00:08, 2327.83it/s]","\rparsing log, completed traces ::  87%|########6 | 130188/150370 [00:20<00:06, 2941.43it/s]","\rparsing log, completed traces ::  87%|########7 | 130943/150370 [00:20<00:05, 3603.81it/s]","\rparsing log, completed traces ::  88%|########7 | 131714/150370 [00:20<00:04, 4303.13it/s]","\rparsing log, completed traces ::  88%|########8 | 132583/150370 [00:20<00:03, 5158.18it/s]","\rparsing log, completed traces ::  89%|########8 | 133423/150370 [00:20<00:02, 5865.95it/s]","\rparsing log, completed traces ::  89%|########9 | 134194/150370 [00:20<00:02, 6268.81it/s]","\rparsing log, completed traces ::  90%|########9 | 134960/150370 [00:21<00:02, 6608.29it/s]","\rparsing log, completed traces ::  90%|######### | 135724/150370 [00:21<00:02, 6804.90it/s]","\rparsing log, completed traces ::  91%|######### | 136479/150370 [00:21<00:01, 6961.12it/s]","\rparsing log, completed traces ::  91%|#########1| 137229/150370 [00:21<00:01, 7069.48it/s]","\rparsing log, completed traces ::  92%|#########1| 137974/150370 [00:21<00:01, 7138.36it/s]","\rparsing log, completed traces ::  92%|#########2| 138722/150370 [00:21<00:01, 7229.34it/s]","\rparsing log, completed traces ::  93%|#########2| 139471/150370 [00:21<00:01, 7293.45it/s]","\rparsing log, completed traces ::  93%|#########3| 140232/150370 [00:21<00:01, 7380.24it/s]","\rparsing log, completed traces ::  94%|#########3| 140997/150370 [00:21<00:01, 7458.48it/s]","\rparsing log, completed traces ::  94%|#########4| 141788/150370 [00:21<00:01, 7591.32it/s]","\rparsing log, completed traces ::  95%|#########4| 142553/150370 [00:22<00:01, 7594.95it/s]","\rparsing log, completed traces ::  95%|#########5| 143319/150370 [00:22<00:00, 7614.20it/s]","\rparsing log, completed traces ::  96%|#########5| 144094/150370 [00:22<00:00, 7649.96it/s]","\rparsing log, completed traces ::  96%|#########6| 144861/150370 [00:22<00:00, 7561.03it/s]","\rparsing log, completed traces ::  97%|#########6| 145619/150370 [00:22<00:00, 7174.16it/s]","\rparsing log, completed traces ::  97%|#########7| 146342/150370 [00:22<00:00, 6643.37it/s]","\rparsing log, completed traces ::  98%|#########7| 147017/150370 [00:22<00:00, 6452.48it/s]","\rparsing log, completed traces ::  98%|#########8| 147669/150370 [00:22<00:00, 6340.51it/s]","\rparsing log, completed traces ::  99%|#########8| 148308/150370 [00:22<00:00, 6272.22it/s]","\rparsing log, completed traces ::  99%|#########9| 148963/150370 [00:23<00:00, 6349.01it/s]","\rparsing log, completed traces :: 100%|#########9| 149635/150370 [00:23<00:00, 6436.81it/s]","\rparsing log, completed traces :: 100%|#########9| 150356/150370 [00:23<00:00, 6660.35it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:23<00:00, 6465.54it/s]","\n","[data] Loaded datasets: ['BPI2012', 'BPI2017', 'ROAD']","\n","\n=== Dataset: BPI2012 ===","\n","Samples train/val/test: 22252/4176/4196; vocab=23","\n","Epoch 1: validation_loss = 0.5594 | val_acc=0.7409 | val_f1=0.5316 | val_top3=0.9840","\n","Epoch 2: validation_loss = 0.5308 | val_acc=0.7598 | val_f1=0.5425 | val_top3=0.9854","\n","Epoch 3: validation_loss = 0.5333 | val_acc=0.7574 | val_f1=0.5725 | val_top3=0.9859","\n","Epoch 4: validation_loss = 0.5195 | val_acc=0.7629 | val_f1=0.5835 | val_top3=0.9861","\n","Epoch 5: validation_loss = 0.5221 | val_acc=0.7450 | val_f1=0.6007 | val_top3=0.9854","\n","Epoch 6: validation_loss = 0.5249 | val_acc=0.7634 | val_f1=0.5833 | val_top3=0.9861","\n","Epoch 7: validation_loss = 0.5073 | val_acc=0.7639 | val_f1=0.5909 | val_top3=0.9856","\n","Epoch 8: validation_loss = 0.5113 | val_acc=0.7593 | val_f1=0.5790 | val_top3=0.9859","\n","Epoch 9: validation_loss = 0.5105 | val_acc=0.7639 | val_f1=0.5842 | val_top3=0.9852","\n","Epoch 10: validation_loss = 0.5201 | val_acc=0.7634 | val_f1=0.5797 | val_top3=0.9847","\n","[BPI2012] Train: loss=0.5148 acc=0.7777 f1=0.5609 top3=0.9868","\n","[BPI2012] Test:  loss=0.5355 acc=0.7569 f1=0.5872 top3=0.9874","\n","\n=== Dataset: BPI2017 ===","\n","Samples train/val/test: 34519/7403/7374; vocab=24","\n","Epoch 1: validation_loss = 0.4172 | val_acc=0.8368 | val_f1=0.5299 | val_top3=0.9904","\n","Epoch 2: validation_loss = 0.4004 | val_acc=0.8367 | val_f1=0.5595 | val_top3=0.9907","\n","Epoch 3: validation_loss = 0.3864 | val_acc=0.8384 | val_f1=0.5719 | val_top3=0.9912","\n","Epoch 4: validation_loss = 0.3847 | val_acc=0.8395 | val_f1=0.5903 | val_top3=0.9919","\n","Epoch 5: validation_loss = 0.3812 | val_acc=0.8405 | val_f1=0.5856 | val_top3=0.9922","\n","Epoch 6: validation_loss = 0.3802 | val_acc=0.8376 | val_f1=0.5896 | val_top3=0.9916","\n","Epoch 7: validation_loss = 0.3769 | val_acc=0.8361 | val_f1=0.5957 | val_top3=0.9924","\n","Epoch 8: validation_loss = 0.3799 | val_acc=0.8386 | val_f1=0.6180 | val_top3=0.9927","\n","Epoch 9: validation_loss = 0.3805 | val_acc=0.8391 | val_f1=0.5989 | val_top3=0.9926","\n","Epoch 10: validation_loss = 0.3756 | val_acc=0.8399 | val_f1=0.6155 | val_top3=0.9928","\n","[BPI2017] Train: loss=0.3607 acc=0.8422 f1=0.5721 top3=0.9941","\n","[BPI2017] Test:  loss=0.3877 acc=0.8332 f1=0.5710 top3=0.9906","\n","\n=== Dataset: ROAD ===","\n","Samples train/val/test: 8707/1928/1869; vocab=11","\n","Epoch 1: validation_loss = 0.4913 | val_acc=0.7993 | val_f1=0.3684 | val_top3=0.9922","\n","Epoch 2: validation_loss = 0.4561 | val_acc=0.8086 | val_f1=0.4514 | val_top3=0.9948","\n","Epoch 3: validation_loss = 0.4566 | val_acc=0.8091 | val_f1=0.5300 | val_top3=0.9969","\n","Epoch 4: validation_loss = 0.4482 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 5: validation_loss = 0.4355 | val_acc=0.8112 | val_f1=0.6427 | val_top3=0.9969","\n","Epoch 6: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 7: validation_loss = 0.4328 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 8: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 9: validation_loss = 0.4274 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 10: validation_loss = 0.4329 | val_acc=0.8122 | val_f1=0.6664 | val_top3=0.9969","\n","[ROAD] Train: loss=0.4662 acc=0.7894 f1=0.5395 top3=0.9986","\n","[ROAD] Test:  loss=0.4833 acc=0.8020 f1=0.4740 top3=0.9936","\n","Execution time: 3 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the numpy file from the specified working directory, parse the nested experiment_data structure, and compute final or best metrics as requested. For training and test, I will report the final metrics saved in the structure. For validation, I will compute the best values across epochs for accuracy, F1 score, and top-3 accuracy, and the minimum validation loss using the recorded loss history. The script prints the dataset name followed by clearly labeled metrics and executes immediately.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef safe_get(d, *keys, default=None):\n    cur = d\n    for k in keys:\n        if isinstance(cur, dict) and k in cur:\n            cur = cur[k]\n        else:\n            return default\n    return cur\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.isfile(path):\n        raise FileNotFoundError(f\"File not found: {path}\")\n    data = np.load(path, allow_pickle=True).item()\n    if not isinstance(data, dict):\n        raise ValueError(\"Loaded experiment_data is not a dict.\")\n    return data\n\n\ndef extract_final_train_metrics(ds_data):\n    # Expect a 'final' entry\n    train_entries = safe_get(ds_data, \"metrics\", \"train\", default=[])\n    final = None\n    for tag, vals in train_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"train loss\"] = final.get(\"loss\", None)\n        out[\"train accuracy\"] = final.get(\"acc\", None)\n        out[\"train F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"train top-3 accuracy\"] = final.get(\"top3\", None)\n    else:\n        # Fallback: try last value from losses for loss only\n        train_losses = safe_get(ds_data, \"losses\", \"train\", default=[])\n        if train_losses:\n            out[\"train loss\"] = train_losses[-1][1]\n    return out\n\n\ndef extract_best_val_metrics(ds_data):\n    # Collect per-epoch validation metrics (acc, macro_f1, top3)\n    val_entries = safe_get(ds_data, \"metrics\", \"val\", default=[])\n    best = {\n        \"validation accuracy\": None,\n        \"validation F1 score\": None,\n        \"validation top-3 accuracy\": None,\n    }\n    for tag, vals in val_entries:\n        if isinstance(vals, dict):\n            acc = vals.get(\"acc\", None)\n            f1 = vals.get(\"macro_f1\", None)\n            top3 = vals.get(\"top3\", None)\n            if acc is not None:\n                best[\"validation accuracy\"] = (\n                    acc\n                    if best[\"validation accuracy\"] is None\n                    else max(best[\"validation accuracy\"], acc)\n                )\n            if f1 is not None:\n                best[\"validation F1 score\"] = (\n                    f1\n                    if best[\"validation F1 score\"] is None\n                    else max(best[\"validation F1 score\"], f1)\n                )\n            if top3 is not None:\n                best[\"validation top-3 accuracy\"] = (\n                    top3\n                    if best[\"validation top-3 accuracy\"] is None\n                    else max(best[\"validation top-3 accuracy\"], top3)\n                )\n    # For validation loss, use recorded losses per epoch and take the minimum\n    val_losses = safe_get(ds_data, \"losses\", \"val\", default=[])\n    if val_losses:\n        min_val_loss = min((v for (_, v) in val_losses), default=None)\n    else:\n        # fallback: check 'final' val entry if present\n        min_val_loss = None\n        for tag, vals in val_entries:\n            if tag == \"final\" and isinstance(vals, dict):\n                min_val_loss = vals.get(\"loss\", None)\n                break\n    out = {\"validation loss\": min_val_loss}\n    out.update(best)\n    return out\n\n\ndef extract_final_test_metrics(ds_data):\n    test_entries = safe_get(ds_data, \"metrics\", \"test\", default=[])\n    final = None\n    for tag, vals in test_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"test loss\"] = final.get(\"loss\", None)\n        out[\"test accuracy\"] = final.get(\"acc\", None)\n        out[\"test F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"test top-3 accuracy\"] = final.get(\"top3\", None)\n    return out\n\n\ndef format_print_metrics(dataset_name, metrics_dict):\n    print(dataset_name)\n    # Keep a consistent order for readability\n    ordered_keys = [\n        \"train loss\",\n        \"train accuracy\",\n        \"train F1 score\",\n        \"train top-3 accuracy\",\n        \"validation loss\",\n        \"validation accuracy\",\n        \"validation F1 score\",\n        \"validation top-3 accuracy\",\n        \"test loss\",\n        \"test accuracy\",\n        \"test F1 score\",\n        \"test top-3 accuracy\",\n    ]\n    printed_any = False\n    for k in ordered_keys:\n        if k in metrics_dict and metrics_dict[k] is not None:\n            val = metrics_dict[k]\n            if isinstance(val, float):\n                print(f\"{k}: {val:.4f}\")\n            else:\n                print(f\"{k}: {val}\")\n            printed_any = True\n    # Print any remaining keys that were not in the ordered list\n    for k, v in metrics_dict.items():\n        if k not in ordered_keys and v is not None:\n            if isinstance(v, float):\n                print(f\"{k}: {v:.4f}\")\n            else:\n                print(f\"{k}: {v}\")\n            printed_any = True\n    if not printed_any:\n        print(\"No metrics available\")\n\n\ndef run():\n    experiment_data = load_experiment_data()\n    for ds_name, ds_data in experiment_data.items():\n        all_metrics = {}\n        all_metrics.update(extract_final_train_metrics(ds_data))\n        all_metrics.update(extract_best_val_metrics(ds_data))\n        all_metrics.update(extract_final_test_metrics(ds_data))\n        format_print_metrics(ds_name, all_metrics)\n\n\n# Execute immediately\nrun()\n","parse_term_out":["BPI2012","\n","train loss: 0.5148","\n","train accuracy: 0.7777","\n","train F1 score: 0.5609","\n","train top-3 accuracy: 0.9868","\n","validation loss: 0.5073","\n","validation accuracy: 0.7639","\n","validation F1 score: 0.6007","\n","validation top-3 accuracy: 0.9861","\n","test loss: 0.5355","\n","test accuracy: 0.7569","\n","test F1 score: 0.5872","\n","test top-3 accuracy: 0.9874","\n","BPI2017","\n","train loss: 0.3607","\n","train accuracy: 0.8422","\n","train F1 score: 0.5721","\n","train top-3 accuracy: 0.9941","\n","validation loss: 0.3756","\n","validation accuracy: 0.8405","\n","validation F1 score: 0.6180","\n","validation top-3 accuracy: 0.9928","\n","test loss: 0.3877","\n","test accuracy: 0.8332","\n","test F1 score: 0.5710","\n","test top-3 accuracy: 0.9906","\n","ROAD","\n","train loss: 0.4662","\n","train accuracy: 0.7894","\n","train F1 score: 0.5395","\n","train top-3 accuracy: 0.9986","\n","validation loss: 0.4274","\n","validation accuracy: 0.8122","\n","validation F1 score: 0.6664","\n","validation top-3 accuracy: 0.9969","\n","test loss: 0.4833","\n","test accuracy: 0.8020","\n","test F1 score: 0.4740","\n","test top-3 accuracy: 0.9936","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":237.2300136089325,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"Overall run completed successfully with valid time-based splits, per-log evaluation on BPI 2012/2017 and ROAD, and required next-activity metrics (acc/macro-F1/top-3). However, there is a latent bug in build_prefix_dataset regarding lifecycle filtering fallback: df is filtered to lifecycle=='complete' and if that results in an empty dataframe, the fallback mistakenly does df = df.copy() (copying the empty df) and then sorts it, thereby losing the original unfiltered events. This would silently produce zero samples on logs lacking explicit 'complete' transitions. Fix: preserve the original dataframe before filtering and revert to it when the filtered result is empty, e.g., df_orig = df.copy(); df_f = df[df['lifecycle'].astype(str).str.lower().eq('complete')]; df = df_f if len(df_f)>0 else df_orig; then sort by ['case_id','timestamp']. Additionally, for stricter no-leakage hygiene, build the activity vocabulary and any feature normalization strictly on the train split (the code already re-normalizes by train stats, but vocab is constructed on all data), although this is not a runtime bug. All other components (loss, target indexing, top-3 computation, saving artifacts) appear consistent with the output logs.","exp_results_dir":null,"metric":{"value":{"metric_names":[{"metric_name":"train loss","lower_is_better":true,"description":"Training loss at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.5148,"best_value":0.5148},{"dataset_name":"BPI2017","final_value":0.3607,"best_value":0.3607},{"dataset_name":"ROAD","final_value":0.4662,"best_value":0.4662}]},{"metric_name":"train accuracy","lower_is_better":false,"description":"Training accuracy at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.7777,"best_value":0.7777},{"dataset_name":"BPI2017","final_value":0.8422,"best_value":0.8422},{"dataset_name":"ROAD","final_value":0.7894,"best_value":0.7894}]},{"metric_name":"train F1 score","lower_is_better":false,"description":"Training F1 score at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.5609,"best_value":0.5609},{"dataset_name":"BPI2017","final_value":0.5721,"best_value":0.5721},{"dataset_name":"ROAD","final_value":0.5395,"best_value":0.5395}]},{"metric_name":"train top-3 accuracy","lower_is_better":false,"description":"Training top-3 accuracy at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.9868,"best_value":0.9868},{"dataset_name":"BPI2017","final_value":0.9941,"best_value":0.9941},{"dataset_name":"ROAD","final_value":0.9986,"best_value":0.9986}]},{"metric_name":"validation loss","lower_is_better":true,"description":"Validation loss at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.5073,"best_value":0.5073},{"dataset_name":"BPI2017","final_value":0.3756,"best_value":0.3756},{"dataset_name":"ROAD","final_value":0.4274,"best_value":0.4274}]},{"metric_name":"validation accuracy","lower_is_better":false,"description":"Validation accuracy at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.7639,"best_value":0.7639},{"dataset_name":"BPI2017","final_value":0.8405,"best_value":0.8405},{"dataset_name":"ROAD","final_value":0.8122,"best_value":0.8122}]},{"metric_name":"validation F1 score","lower_is_better":false,"description":"Validation F1 score at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.6007,"best_value":0.6007},{"dataset_name":"BPI2017","final_value":0.618,"best_value":0.618},{"dataset_name":"ROAD","final_value":0.6664,"best_value":0.6664}]},{"metric_name":"validation top-3 accuracy","lower_is_better":false,"description":"Validation top-3 accuracy at the end of training","data":[{"dataset_name":"BPI2012","final_value":0.9861,"best_value":0.9861},{"dataset_name":"BPI2017","final_value":0.9928,"best_value":0.9928},{"dataset_name":"ROAD","final_value":0.9969,"best_value":0.9969}]},{"metric_name":"test loss","lower_is_better":true,"description":"Test loss at evaluation time","data":[{"dataset_name":"BPI2012","final_value":0.5355,"best_value":0.5355},{"dataset_name":"BPI2017","final_value":0.3877,"best_value":0.3877},{"dataset_name":"ROAD","final_value":0.4833,"best_value":0.4833}]},{"metric_name":"test accuracy","lower_is_better":false,"description":"Test accuracy at evaluation time","data":[{"dataset_name":"BPI2012","final_value":0.7569,"best_value":0.7569},{"dataset_name":"BPI2017","final_value":0.8332,"best_value":0.8332},{"dataset_name":"ROAD","final_value":0.802,"best_value":0.802}]},{"metric_name":"test F1 score","lower_is_better":false,"description":"Test F1 score at evaluation time","data":[{"dataset_name":"BPI2012","final_value":0.5872,"best_value":0.5872},{"dataset_name":"BPI2017","final_value":0.571,"best_value":0.571},{"dataset_name":"ROAD","final_value":0.474,"best_value":0.474}]},{"metric_name":"test top-3 accuracy","lower_is_better":false,"description":"Test top-3 accuracy at evaluation time","data":[{"dataset_name":"BPI2012","final_value":0.9874,"best_value":0.9874},{"dataset_name":"BPI2017","final_value":0.9906,"best_value":0.9906},{"dataset_name":"ROAD","final_value":0.9936,"best_value":0.9936}]}]},"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":null,"is_seed_node":true,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"# Set random seed\nimport random\nimport numpy as np\nimport torch\n\nseed = 1\nrandom.seed(seed)\nnp.random.seed(seed)\ntorch.manual_seed(seed)\nif torch.cuda.is_available():\n    torch.cuda.manual_seed(seed)\n\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport matplotlib.pyplot as plt\n\n# Device handling (required)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure\nexperiment_data = {\n    \"BPI2012\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"BPI2017\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"ROAD\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n}\n\n# Data loading utilities (use provided helper)\nfrom ai_scientist.ideas.my_research_topic import load_datasets, pick_default_dataset\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    # Keep only 'complete' transitions if lifecycle exists\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()  # fallback if empty\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    # Build activity vocab\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        # Convert to numpy arrays for safe positional indexing\n        ts_ns = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        )  # nanoseconds\n        ts = (ts_ns // 10**9).astype(np.int64)  # seconds as numpy array\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        # simple calendar features\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        # time deltas and since start in seconds\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(\n            np.float32\n        )  # [T,5]\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        # Generate prefixes of length k (min_prefix_len..min(max_prefix_len, T-1)); target = activity at position k\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    # Collect feature normalization stats over all feats (initial; will be recomputed on train split)\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)  # [B,T,emb]\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            # top-3 correctness\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_one_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples across all to get vocab; we'll re-normalize with train stats\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter per split\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training loop\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {epoch}: validation_loss = {val_loss:.4f} | val_acc={val_acc:.4f} | val_f1={val_f1:.4f} | val_top3={val_top3:.4f}\"\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        experiment_data[name][\"losses\"][\"train\"].append((epoch, train_loss))\n        experiment_data[name][\"losses\"][\"val\"].append((epoch, val_loss))\n        experiment_data[name][\"metrics\"][\"val\"].append(\n            (epoch, {\"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3})\n        )\n        experiment_data[name][\"epochs\"].append(epoch)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n\n    # Load best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final eval on train/val/test\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Save metrics\n    experiment_data[name][\"metrics\"][\"train\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n        )\n    )\n    experiment_data[name][\"metrics\"][\"val\"].append(\n        (\n            \"final\",\n            {\"loss\": val_loss, \"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3},\n        )\n    )\n    experiment_data[name][\"metrics\"][\"test\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        )\n    )\n    experiment_data[name][\"predictions\"] = y_pred_t.tolist()\n    experiment_data[name][\"ground_truth\"] = y_true_t.tolist()\n\n    # Plots\n    try:\n        plt.figure()\n        plt.plot(hist[\"train_loss\"], label=\"train_loss\")\n        plt.plot(hist[\"val_loss\"], label=\"val_loss\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"loss_curves_{name}.png\"))\n        plt.close()\n\n        plt.figure()\n        plt.plot(hist[\"val_top3\"], label=\"val_top3\")\n        plt.legend()\n        plt.title(f\"Val Top-3 Acc - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Top-3 Acc\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"val_top3_{name}.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"[warn] Plotting failed: {e}\")\n\n    # Save confusion matrix-like data (optional)\n    try:\n        from sklearn.metrics import confusion_matrix\n\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"cm_{name}.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n\n\ndef main():\n    datasets = load_datasets()\n    # Loop through loaded datasets; cap to 5000 earliest cases for speed\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        train_one_dataset(\n            key, df_small, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    np.savez_compressed(\n        os.path.join(working_dir, \"experiment_data_compressed.npz\"),\n        data=experiment_data,\n    )\n\n\n# Execute immediately\nmain()\n","plan":"Seed node","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import (\n    f1_score,\n    accuracy_score,\n    confusion_matrix,\n    precision_recall_curve,\n    average_precision_score,\n)\nfrom sklearn.preprocessing import label_binarize\nimport random\nimport math\nfrom collections import defaultdict\n\n# Reproducibility and device\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# --------- Data loading from local XES via pm4py ----------\ndef load_xes_folder(data_dir=\"data\"):\n    datasets = {}\n    try:\n        import pm4py\n    except Exception as e:\n        print(f\"pm4py not available: {e}\")\n        return datasets\n    if not os.path.isdir(data_dir):\n        print(f\"Data directory not found: {data_dir}\")\n        return datasets\n    for fn in os.listdir(data_dir):\n        if fn.lower().endswith(\".xes\") or fn.lower().endswith(\".xes.gz\"):\n            path = os.path.join(data_dir, fn)\n            try:\n                log = pm4py.read_xes(path)\n                df = pm4py.convert_to_dataframe(log)\n                # Standardize columns\n                # pm4py dataframe typically has case:concept:name, concept:name, time:timestamp, lifecycle:transition\n                cols = df.columns\n                case_col = (\n                    \"case:concept:name\"\n                    if \"case:concept:name\" in cols\n                    else (\"case\" if \"case\" in cols else None)\n                )\n                act_col = (\n                    \"concept:name\"\n                    if \"concept:name\" in cols\n                    else (\"activity\" if \"activity\" in cols else None)\n                )\n                ts_col = (\n                    \"time:timestamp\"\n                    if \"time:timestamp\" in cols\n                    else (\"timestamp\" if \"timestamp\" in cols else None)\n                )\n                life_col = (\n                    \"lifecycle:transition\"\n                    if \"lifecycle:transition\" in cols\n                    else (\"lifecycle\" if \"lifecycle\" in cols else None)\n                )\n                if case_col is None or act_col is None or ts_col is None:\n                    print(f\"Missing required columns in {fn}, skipping.\")\n                    continue\n                out = pd.DataFrame(\n                    {\n                        \"case_id\": df[case_col].astype(str).values,\n                        \"activity\": df[act_col].astype(str).values,\n                        \"timestamp\": pd.to_datetime(df[ts_col], utc=True),\n                    }\n                )\n                if life_col is not None:\n                    out[\"lifecycle\"] = df[life_col].astype(str).values\n                name = os.path.splitext(fn)[0]\n                datasets[name] = out\n                print(\n                    f\"Loaded {name}: {len(out)} events, {out['case_id'].nunique()} cases\"\n                )\n            except Exception as e:\n                print(f\"Failed to load {fn}: {e}\")\n    return datasets\n\n\n# --------- Prefix building and split ----------\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if mask.any():\n            df = df[mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        if len(g) < 2:\n            continue\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        ts = (g_ts.astype(\"int64\") // 10**9).to_numpy(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                    \"prefix_len\": k,\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    for s in samples:\n        pass  # initial no norm; will norm on train split\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.vstack(\n            [\n                np.zeros((pad_len, self.num_cont), dtype=np.float32),\n                feats.astype(np.float32),\n            ]\n        )\n        attn = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad).long(),\n            \"feats\": torch.tensor(feats_pad).float(),\n            \"mask\": torch.tensor(attn).float(),\n            \"y\": torch.tensor(s[\"target\"]).long(),\n            \"prefix_len\": L,\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, pad_idx=0):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim, hidden_size=hidden, batch_first=True\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h = self.dropout(h[-1])\n        return self.fc(h)\n\n\ndef collate_fn(batch):\n    out = {\n        k: (\n            torch.stack([b[k] for b in batch], 0)\n            if isinstance(batch[0][k], torch.Tensor)\n            else [b[k] for b in batch]\n        )\n        for k in batch[0].keys()\n    }\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys = []\n    yhat = []\n    probs_list = []\n    n = 0\n    top3_correct = 0\n    pref_lens = []\n    top3_flags = []\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk = torch.topk(probs, k=k_val, dim=1)\n            y = batch[\"y\"]\n            ys.extend(y.detach().cpu().tolist())\n            yhat.extend(top1.detach().cpu().tolist())\n            probs_list.append(probs.detach().cpu().numpy())\n            for i in range(y.size(0)):\n                flag = int(y[i].item() in topk[i].detach().cpu().tolist())\n                top3_correct += flag\n                top3_flags.append(flag)\n                pref_lens.append(int(batch[\"prefix_len\"][i].item()))\n            n += y.size(0)\n    avg_loss = total_loss / max(1, n)\n    y_true = np.array(ys)\n    y_pred = np.array(yhat)\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n))\n    probs_concat = (\n        np.concatenate(probs_list, axis=0)\n        if len(probs_list) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return (\n        avg_loss,\n        acc,\n        f1,\n        top3,\n        y_true,\n        y_pred,\n        probs_concat,\n        np.array(pref_lens),\n        np.array(top3_flags),\n    )\n\n\ndef train_on_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    s_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    s_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    s_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # normalize time features on train\n    if len(s_train) > 0:\n        feats = np.concatenate(\n            [s[\"seq_feats\"] for s in s_train if len(s[\"seq_feats\"]) > 0], axis=0\n        )\n        dt_mean, dt_std = feats[:, 0].mean(), feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = feats[:, 1].mean(), feats[:, 1].std() + 1e-6\n\n        def norm(samples):\n            for s in samples:\n                if s[\"seq_feats\"].shape[0] > 0:\n                    s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                    s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n        norm(s_train)\n        norm(s_val)\n        norm(s_test)\n    print(\n        f\"Samples train/val/test: {len(s_train)}/{len(s_val)}/{len(s_test)}; vocab={len(act2id)}\"\n    )\n    if len(s_train) == 0 or len(act2id) < 2:\n        print(\"Insufficient data; skipping.\")\n        return None\n    ds_tr = PrefixDataset(s_train, pad_id, max_prefix_len, 5)\n    ds_va = PrefixDataset(s_val, pad_id, max_prefix_len, 5)\n    ds_te = PrefixDataset(s_test, pad_id, max_prefix_len, 5)\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn\n    )\n    dl_va = DataLoader(\n        ds_va, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    dl_te = DataLoader(\n        ds_te, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    model = LSTMBaseline(\n        vocab_size=len(act2id), emb_dim=64, cont_dim=5, hidden=128, pad_idx=pad_id\n    ).to(device)\n    crit = nn.CrossEntropyLoss().to(device)\n    opt = torch.optim.Adam(model.parameters(), lr=lr)\n    best_top3 = -1.0\n    best_state = None\n    history = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for ep in range(1, max_epochs + 1):\n        model.train()\n        tot = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            opt.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = crit(logits, batch[\"y\"])\n            loss.backward()\n            opt.step()\n            run_loss += loss.item() * logits.size(0)\n            tot += logits.size(0)\n        tr_loss = run_loss / max(1, tot)\n        va_loss, va_acc, va_f1, va_top3, *_ = evaluate(\n            model, dl_va, crit, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {ep}: val_loss={va_loss:.4f} acc={va_acc:.4f} f1={va_f1:.4f} top3={va_top3:.4f}\"\n        )\n        history[\"train_loss\"].append(tr_loss)\n        history[\"val_loss\"].append(va_loss)\n        history[\"val_top3\"].append(va_top3)\n        if va_top3 > best_top3:\n            best_top3 = va_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    tr_loss, tr_acc, tr_f1, tr_top3, *_ = evaluate(\n        model, dl_tr, crit, device, len(act2id), pad_id\n    )\n    te_loss, te_acc, te_f1, te_top3, y_true, y_pred, probs, pref_lens, top3_flags = (\n        evaluate(model, dl_te, crit, device, len(act2id), pad_id)\n    )\n    print(\n        f\"[{name}] Test: loss={te_loss:.4f} acc={te_acc:.4f} f1={te_f1:.4f} top3={te_top3:.4f}\"\n    )\n    # package experiment data\n    exp = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": tr_loss,\n                        \"acc\": tr_acc,\n                        \"macro_f1\": tr_f1,\n                        \"top3\": tr_top3,\n                    },\n                )\n            ],\n            \"val\": [],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": te_loss,\n                        \"acc\": te_acc,\n                        \"macro_f1\": te_f1,\n                        \"top3\": te_top3,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(history[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(history[\"val_loss\"], start=1)),\n        },\n        \"predictions\": y_pred.tolist(),\n        \"ground_truth\": y_true.tolist(),\n        \"epochs\": list(range(1, len(history[\"train_loss\"]) + 1)),\n        \"probs\": probs,\n        \"prefix_lens\": pref_lens.tolist(),\n        \"top3_flags\": top3_flags.tolist(),\n        \"act2id\": act2id,\n    }\n    # plots for this dataset\n    try:\n        plt.figure()\n        plt.plot(history[\"train_loss\"], label=\"train\")\n        plt.plot(history[\"val_loss\"], label=\"val\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating loss curves for {name}: {e}\")\n        plt.close()\n    try:\n        cm = confusion_matrix(y_true, y_pred)\n        plt.figure(figsize=(5, 4))\n        plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n        plt.colorbar()\n        plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n        plt.xlabel(\"Predicted\")\n        plt.ylabel(\"True\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_confusion_matrix.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {name}: {e}\")\n        plt.close()\n    try:\n        # Top-3 accuracy vs prefix length\n        if len(pref_lens) > 0:\n            d = defaultdict(list)\n            for L, flag in zip(pref_lens, top3_flags):\n                d[int(L)].append(int(flag))\n            xs = sorted(d.keys())\n            ys = [np.mean(d[k]) for k in xs]\n            plt.figure()\n            plt.plot(xs, ys, marker=\"o\")\n            plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n            plt.xlabel(\"Prefix Length\")\n            plt.ylabel(\"Top-3 Accuracy\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_top3_vs_prefixlen.png\"))\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating Top-3 vs prefix length for {name}: {e}\")\n        plt.close()\n    try:\n        # Macro PR curve (one-vs-rest); may be coarse due to many classes\n        if probs.shape[0] > 0:\n            classes = np.unique(y_true)\n            Y = label_binarize(y_true, classes=range(probs.shape[1]))\n            # only keep columns present in classes to avoid PAD\n            present = [c for c in classes]\n            if len(present) > 1:\n                precisions = []\n                recalls = []\n                aps = []\n                for c in present:\n                    p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                    ap = average_precision_score(Y[:, c], probs[:, c])\n                    precisions.append(\n                        np.interp(np.linspace(0, 1, 101), r[::-1], p[::-1])\n                    )\n                    recalls.append(np.linspace(0, 1, 101))\n                    aps.append(ap)\n                macro_p = np.mean(np.stack(precisions, 0), 0)\n                macro_r = np.linspace(0, 1, 101)\n                plt.figure()\n                plt.plot(macro_r, macro_p, label=f\"Macro-PR (mAP={np.mean(aps):.3f})\")\n                plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Recall\")\n                plt.ylabel(\"Precision\")\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(os.path.join(working_dir, f\"{name}_macro_pr.png\"))\n                plt.close()\n    except Exception as e:\n        print(f\"Error creating PR curve for {name}: {e}\")\n        plt.close()\n    return name, exp\n\n\ndef main():\n    datasets = load_xes_folder(data_dir=os.path.join(os.getcwd(), \"data\"))\n    experiment_data = {}\n    for name, df in datasets.items():\n        # optional cap earliest 5000 cases\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep = set(starts.iloc[:5000][\"case_id\"])\n                df = df[df[\"case_id\"].isin(keep)].copy()\n        except:\n            pass\n        res = train_on_dataset(\n            name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n        if res is not None:\n            k, exp = res\n            experiment_data[k] = exp\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    # Print evaluation metrics\n    for k, v in experiment_data.items():\n        test_metrics = dict(v[\"metrics\"][\"test\"][0][1])\n        print(\n            f\"{k} | Test acc={test_metrics['acc']:.4f} macro_f1={test_metrics['macro_f1']:.4f} top3={test_metrics['top3']:.4f} loss={test_metrics['loss']:.4f}\"\n        )\n\n    # Secondary plotting pass strictly from experiment_data.npy (as required)\n    try:\n        experiment_data_loaded = np.load(\n            os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n        ).item()\n    except Exception as e:\n        print(f\"Error loading experiment data: {e}\")\n        experiment_data_loaded = {}\n    for name, ed in experiment_data_loaded.items():\n        try:\n            # re-plot loss curves from saved data\n            plt.figure()\n            tl = [y for (_, y) in ed.get(\"losses\", {}).get(\"train\", [])]\n            vl = [y for (_, y) in ed.get(\"losses\", {}).get(\"val\", [])]\n            if len(tl) > 0:\n                plt.plot(tl, label=\"train\")\n            if len(vl) > 0:\n                plt.plot(vl, label=\"val\")\n            plt.legend()\n            plt.title(f\"Loss Curves - {name}\\nNext-activity\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves_reload.png\"))\n            plt.close()\n        except Exception as e:\n            print(f\"Error creating plot1: {e}\")\n            plt.close()\n        try:\n            # confusion matrix from predictions and ground truth\n            y_true = ed.get(\"ground_truth\", [])\n            y_pred = ed.get(\"predictions\", [])\n            if len(y_true) > 0 and len(y_pred) > 0:\n                cm = confusion_matrix(y_true, y_pred)\n                plt.figure(figsize=(5, 4))\n                plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n                plt.colorbar()\n                plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Predicted\")\n                plt.ylabel(\"True\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_confusion_matrix_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot2: {e}\")\n            plt.close()\n        try:\n            # Top-3 vs prefix length if present\n            pref = ed.get(\"prefix_lens\", [])\n            flags = ed.get(\"top3_flags\", [])\n            if len(pref) > 0 and len(flags) > 0:\n                d = defaultdict(list)\n                for L, f in zip(pref, flags):\n                    d[int(L)].append(int(f))\n                xs = sorted(d.keys())\n                ys = [float(np.mean(d[x])) for x in xs]\n                plt.figure()\n                plt.plot(xs, ys, marker=\"o\")\n                plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n                plt.xlabel(\"Prefix Length\")\n                plt.ylabel(\"Top-3 Accuracy\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_top3_vs_prefixlen_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot3: {e}\")\n            plt.close()\n        try:\n            # Macro PR curve if probs available\n            probs = np.array(ed.get(\"probs\", []))\n            y_true = ed.get(\"ground_truth\", [])\n            if probs.size > 0 and len(y_true) > 0:\n                classes = sorted(set(y_true))\n                Y = label_binarize(np.array(y_true), classes=range(probs.shape[1]))\n                present = classes\n                if len(present) > 1:\n                    precisions = []\n                    aps = []\n                    grid = np.linspace(0, 1, 101)\n                    for c in present:\n                        p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                        precisions.append(np.interp(grid, r[::-1], p[::-1]))\n                        aps.append(average_precision_score(Y[:, c], probs[:, c]))\n                    macro_p = np.mean(np.stack(precisions, 0), 0)\n                    plt.figure()\n                    plt.plot(grid, macro_p, label=f\"mAP={np.mean(aps):.3f}\")\n                    plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                    plt.xlabel(\"Recall\")\n                    plt.ylabel(\"Precision\")\n                    plt.legend()\n                    plt.tight_layout()\n                    plt.savefig(\n                        os.path.join(working_dir, f\"{name}_macro_pr_reload.png\")\n                    )\n                    plt.close()\n        except Exception as e:\n            print(f\"Error creating plot4: {e}\")\n            plt.close()\n\n\nif __name__ == \"__main__\":\n    main()\n","plot_plan":null,"step":11,"id":"57ccd5de0de34674be3985e9f94220ad","ctime":1757762453.9824324,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Available in /workspace/data: ['BPI_Challenge_2012.xes', 'BPI_Challenge_2017.xes', 'Road_Traffic_Fine_Management_Process.xes']","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<22:10,  9.84it/s]","\rparsing log, completed traces ::   1%|1         | 157/13087 [00:00<00:14, 915.39it/s]","\rparsing log, completed traces ::   2%|2         | 315/13087 [00:00<00:10, 1217.67it/s]","\rparsing log, completed traces ::   4%|3         | 480/13087 [00:00<00:09, 1387.18it/s]","\rparsing log, completed traces ::   5%|4         | 648/13087 [00:00<00:08, 1492.01it/s]","\rparsing log, completed traces ::   6%|6         | 831/13087 [00:00<00:07, 1604.97it/s]","\rparsing log, completed traces ::   8%|7         | 999/13087 [00:00<00:07, 1629.37it/s]","\rparsing log, completed traces ::   9%|8         | 1163/13087 [00:00<00:07, 1629.07it/s]","\rparsing log, completed traces ::  10%|#         | 1343/13087 [00:00<00:06, 1682.09it/s]","\rparsing log, completed traces ::  12%|#1        | 1553/13087 [00:01<00:06, 1803.79it/s]","\rparsing log, completed traces ::  13%|#3        | 1734/13087 [00:01<00:06, 1758.44it/s]","\rparsing log, completed traces ::  15%|#4        | 1911/13087 [00:01<00:06, 1721.46it/s]","\rparsing log, completed traces ::  16%|#5        | 2084/13087 [00:01<00:06, 1690.74it/s]","\rparsing log, completed traces ::  17%|#7        | 2254/13087 [00:01<00:06, 1673.17it/s]","\rparsing log, completed traces ::  19%|#8        | 2440/13087 [00:01<00:06, 1726.21it/s]","\rparsing log, completed traces ::  20%|#9        | 2613/13087 [00:01<00:12, 855.50it/s] ","\rparsing log, completed traces ::  21%|##1       | 2770/13087 [00:02<00:10, 978.32it/s]","\rparsing log, completed traces ::  22%|##2       | 2925/13087 [00:02<00:09, 1090.76it/s]","\rparsing log, completed traces ::  24%|##3       | 3080/13087 [00:02<00:08, 1190.36it/s]","\rparsing log, completed traces ::  25%|##5       | 3292/13087 [00:02<00:06, 1412.02it/s]","\rparsing log, completed traces ::  27%|##6       | 3516/13087 [00:02<00:05, 1621.07it/s]","\rparsing log, completed traces ::  28%|##8       | 3706/13087 [00:02<00:05, 1694.21it/s]","\rparsing log, completed traces ::  30%|##9       | 3892/13087 [00:02<00:05, 1684.67it/s]","\rparsing log, completed traces ::  32%|###1      | 4138/13087 [00:02<00:04, 1898.07it/s]","\rparsing log, completed traces ::  33%|###3      | 4377/13087 [00:02<00:04, 2032.00it/s]","\rparsing log, completed traces ::  35%|###5      | 4589/13087 [00:02<00:04, 2057.20it/s]","\rparsing log, completed traces ::  37%|###6      | 4801/13087 [00:03<00:04, 1981.41it/s]","\rparsing log, completed traces ::  38%|###8      | 5008/13087 [00:03<00:04, 2006.55it/s]","\rparsing log, completed traces ::  40%|###9      | 5212/13087 [00:03<00:04, 1909.01it/s]","\rparsing log, completed traces ::  41%|####1     | 5406/13087 [00:03<00:04, 1876.14it/s]","\rparsing log, completed traces ::  43%|####2     | 5596/13087 [00:03<00:04, 1740.65it/s]","\rparsing log, completed traces ::  44%|####4     | 5785/13087 [00:03<00:04, 1778.71it/s]","\rparsing log, completed traces ::  46%|####5     | 5966/13087 [00:04<00:08, 847.16it/s] ","\rparsing log, completed traces ::  47%|####6     | 6118/13087 [00:04<00:07, 952.69it/s]","\rparsing log, completed traces ::  48%|####8     | 6323/13087 [00:04<00:05, 1154.89it/s]","\rparsing log, completed traces ::  50%|####9     | 6515/13087 [00:04<00:05, 1310.58it/s]","\rparsing log, completed traces ::  51%|#####1    | 6684/13087 [00:04<00:04, 1378.98it/s]","\rparsing log, completed traces ::  52%|#####2    | 6853/13087 [00:04<00:04, 1454.64it/s]","\rparsing log, completed traces ::  54%|#####3    | 7020/13087 [00:04<00:04, 1447.24it/s]","\rparsing log, completed traces ::  55%|#####4    | 7188/13087 [00:04<00:03, 1503.55it/s]","\rparsing log, completed traces ::  56%|#####6    | 7351/13087 [00:04<00:03, 1526.85it/s]","\rparsing log, completed traces ::  57%|#####7    | 7512/13087 [00:05<00:03, 1538.94it/s]","\rparsing log, completed traces ::  59%|#####8    | 7672/13087 [00:05<00:03, 1547.00it/s]","\rparsing log, completed traces ::  60%|#####9    | 7852/13087 [00:05<00:03, 1618.39it/s]","\rparsing log, completed traces ::  61%|######1   | 8018/13087 [00:05<00:03, 1548.13it/s]","\rparsing log, completed traces ::  63%|######2   | 8206/13087 [00:05<00:02, 1637.73it/s]","\rparsing log, completed traces ::  64%|######4   | 8386/13087 [00:05<00:02, 1679.30it/s]","\rparsing log, completed traces ::  65%|######5   | 8571/13087 [00:05<00:02, 1727.80it/s]","\rparsing log, completed traces ::  67%|######6   | 8746/13087 [00:05<00:02, 1713.85it/s]","\rparsing log, completed traces ::  68%|######8   | 8919/13087 [00:05<00:02, 1658.40it/s]","\rparsing log, completed traces ::  69%|######9   | 9086/13087 [00:06<00:02, 1640.60it/s]","\rparsing log, completed traces ::  71%|#######   | 9258/13087 [00:06<00:02, 1662.23it/s]","\rparsing log, completed traces ::  72%|#######2  | 9433/13087 [00:06<00:02, 1686.99it/s]","\rparsing log, completed traces ::  73%|#######3  | 9603/13087 [00:06<00:04, 711.12it/s] ","\rparsing log, completed traces ::  75%|#######4  | 9760/13087 [00:06<00:03, 839.99it/s]","\rparsing log, completed traces ::  76%|#######5  | 9935/13087 [00:07<00:03, 998.10it/s]","\rparsing log, completed traces ::  77%|#######7  | 10092/13087 [00:07<00:02, 1112.68it/s]","\rparsing log, completed traces ::  78%|#######8  | 10242/13087 [00:07<00:02, 1177.22it/s]","\rparsing log, completed traces ::  80%|#######9  | 10409/13087 [00:07<00:02, 1293.23it/s]","\rparsing log, completed traces ::  81%|########  | 10562/13087 [00:07<00:01, 1317.46it/s]","\rparsing log, completed traces ::  82%|########2 | 10735/13087 [00:07<00:01, 1420.82it/s]","\rparsing log, completed traces ::  84%|########3 | 10935/13087 [00:07<00:01, 1571.30it/s]","\rparsing log, completed traces ::  85%|########4 | 11108/13087 [00:07<00:01, 1614.57it/s]","\rparsing log, completed traces ::  86%|########6 | 11291/13087 [00:07<00:01, 1672.81it/s]","\rparsing log, completed traces ::  88%|########7 | 11498/13087 [00:07<00:00, 1782.60it/s]","\rparsing log, completed traces ::  89%|########9 | 11681/13087 [00:08<00:00, 1781.45it/s]","\rparsing log, completed traces ::  91%|######### | 11881/13087 [00:08<00:00, 1837.08it/s]","\rparsing log, completed traces ::  92%|#########2| 12069/13087 [00:08<00:00, 1843.33it/s]","\rparsing log, completed traces ::  94%|#########3| 12285/13087 [00:08<00:00, 1933.30it/s]","\rparsing log, completed traces ::  95%|#########5| 12485/13087 [00:08<00:00, 1944.42it/s]","\rparsing log, completed traces ::  97%|#########6| 12688/13087 [00:08<00:00, 1969.28it/s]","\rparsing log, completed traces ::  98%|#########8| 12886/13087 [00:08<00:00, 1969.51it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:08<00:00, 1498.01it/s]","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:45:12,  1.84it/s]","\rparsing log, completed traces ::   0%|          | 68/31509 [00:00<03:44, 140.11it/s]","\rparsing log, completed traces ::   0%|          | 124/31509 [00:00<02:13, 235.86it/s]","\rparsing log, completed traces ::   1%|          | 190/31509 [00:00<01:32, 339.45it/s]","\rparsing log, completed traces ::   1%|          | 252/31509 [00:00<01:15, 411.82it/s]","\rparsing log, completed traces ::   1%|          | 309/31509 [00:01<02:06, 245.67it/s]","\rparsing log, completed traces ::   1%|1         | 370/31509 [00:01<01:40, 308.45it/s]","\rparsing log, completed traces ::   1%|1         | 435/31509 [00:01<01:22, 375.78it/s]","\rparsing log, completed traces ::   2%|1         | 497/31509 [00:01<01:12, 428.95it/s]","\rparsing log, completed traces ::   2%|1         | 556/31509 [00:01<01:06, 467.08it/s]","\rparsing log, completed traces ::   2%|1         | 621/31509 [00:01<01:00, 512.93it/s]","\rparsing log, completed traces ::   2%|2         | 693/31509 [00:01<00:54, 566.72it/s]","\rparsing log, completed traces ::   2%|2         | 758/31509 [00:02<00:52, 588.27it/s]","\rparsing log, completed traces ::   3%|2         | 822/31509 [00:02<00:51, 592.77it/s]","\rparsing log, completed traces ::   3%|2         | 885/31509 [00:02<00:51, 598.13it/s]","\rparsing log, completed traces ::   3%|3         | 958/31509 [00:02<00:48, 633.23it/s]","\rparsing log, completed traces ::   3%|3         | 1026/31509 [00:02<00:47, 644.60it/s]","\rparsing log, completed traces ::   3%|3         | 1092/31509 [00:02<00:48, 628.20it/s]","\rparsing log, completed traces ::   4%|3         | 1158/31509 [00:02<00:47, 636.82it/s]","\rparsing log, completed traces ::   4%|3         | 1228/31509 [00:02<00:46, 653.96it/s]","\rparsing log, completed traces ::   4%|4         | 1295/31509 [00:02<00:46, 655.66it/s]","\rparsing log, completed traces ::   4%|4         | 1365/31509 [00:02<00:45, 667.31it/s]","\rparsing log, completed traces ::   5%|4         | 1433/31509 [00:03<00:45, 654.10it/s]","\rparsing log, completed traces ::   5%|4         | 1499/31509 [00:03<01:33, 320.12it/s]","\rparsing log, completed traces ::   5%|4         | 1566/31509 [00:03<01:19, 378.78it/s]","\rparsing log, completed traces ::   5%|5         | 1632/31509 [00:03<01:09, 431.99it/s]","\rparsing log, completed traces ::   5%|5         | 1694/31509 [00:03<01:03, 470.00it/s]","\rparsing log, completed traces ::   6%|5         | 1760/31509 [00:03<00:57, 513.07it/s]","\rparsing log, completed traces ::   6%|5         | 1821/31509 [00:04<00:56, 530.03it/s]","\rparsing log, completed traces ::   6%|5         | 1881/31509 [00:04<00:54, 546.72it/s]","\rparsing log, completed traces ::   6%|6         | 1947/31509 [00:04<00:51, 577.32it/s]","\rparsing log, completed traces ::   6%|6         | 2012/31509 [00:04<00:49, 593.55it/s]","\rparsing log, completed traces ::   7%|6         | 2076/31509 [00:04<00:48, 604.24it/s]","\rparsing log, completed traces ::   7%|6         | 2142/31509 [00:04<00:47, 619.19it/s]","\rparsing log, completed traces ::   7%|7         | 2208/31509 [00:04<00:46, 628.86it/s]","\rparsing log, completed traces ::   7%|7         | 2278/31509 [00:04<00:45, 649.49it/s]","\rparsing log, completed traces ::   7%|7         | 2344/31509 [00:04<00:45, 645.87it/s]","\rparsing log, completed traces ::   8%|7         | 2410/31509 [00:04<00:44, 649.21it/s]","\rparsing log, completed traces ::   8%|7         | 2476/31509 [00:05<00:44, 650.92it/s]","\rparsing log, completed traces ::   8%|8         | 2544/31509 [00:05<00:43, 658.88it/s]","\rparsing log, completed traces ::   8%|8         | 2619/31509 [00:05<00:42, 685.87it/s]","\rparsing log, completed traces ::   9%|8         | 2688/31509 [00:05<00:42, 684.84it/s]","\rparsing log, completed traces ::   9%|8         | 2757/31509 [00:05<00:43, 667.23it/s]","\rparsing log, completed traces ::   9%|8         | 2830/31509 [00:05<00:42, 682.65it/s]","\rparsing log, completed traces ::   9%|9         | 2899/31509 [00:06<01:29, 320.81it/s]","\rparsing log, completed traces ::   9%|9         | 2970/31509 [00:06<01:14, 384.17it/s]","\rparsing log, completed traces ::  10%|9         | 3039/31509 [00:06<01:04, 442.19it/s]","\rparsing log, completed traces ::  10%|9         | 3103/31509 [00:06<00:58, 483.82it/s]","\rparsing log, completed traces ::  10%|#         | 3171/31509 [00:06<00:53, 528.99it/s]","\rparsing log, completed traces ::  10%|#         | 3235/31509 [00:06<00:51, 552.80it/s]","\rparsing log, completed traces ::  11%|#         | 3309/31509 [00:06<00:46, 601.35it/s]","\rparsing log, completed traces ::  11%|#         | 3382/31509 [00:06<00:44, 635.31it/s]","\rparsing log, completed traces ::  11%|#         | 3459/31509 [00:06<00:41, 672.35it/s]","\rparsing log, completed traces ::  11%|#1        | 3530/31509 [00:06<00:41, 678.91it/s]","\rparsing log, completed traces ::  11%|#1        | 3601/31509 [00:07<00:41, 679.66it/s]","\rparsing log, completed traces ::  12%|#1        | 3672/31509 [00:07<00:40, 686.98it/s]","\rparsing log, completed traces ::  12%|#1        | 3743/31509 [00:07<00:40, 692.76it/s]","\rparsing log, completed traces ::  12%|#2        | 3814/31509 [00:07<00:40, 679.04it/s]","\rparsing log, completed traces ::  12%|#2        | 3883/31509 [00:07<00:40, 679.32it/s]","\rparsing log, completed traces ::  13%|#2        | 3954/31509 [00:07<00:40, 685.63it/s]","\rparsing log, completed traces ::  13%|#2        | 4025/31509 [00:07<00:39, 692.21it/s]","\rparsing log, completed traces ::  13%|#2        | 4095/31509 [00:07<00:39, 688.47it/s]","\rparsing log, completed traces ::  13%|#3        | 4166/31509 [00:07<00:39, 691.25it/s]","\rparsing log, completed traces ::  13%|#3        | 4236/31509 [00:08<00:40, 678.36it/s]","\rparsing log, completed traces ::  14%|#3        | 4304/31509 [00:08<00:40, 670.80it/s]","\rparsing log, completed traces ::  14%|#3        | 4373/31509 [00:08<00:40, 672.93it/s]","\rparsing log, completed traces ::  14%|#4        | 4441/31509 [00:08<01:28, 305.68it/s]","\rparsing log, completed traces ::  14%|#4        | 4509/31509 [00:08<01:14, 363.76it/s]","\rparsing log, completed traces ::  15%|#4        | 4577/31509 [00:08<01:03, 420.82it/s]","\rparsing log, completed traces ::  15%|#4        | 4652/31509 [00:09<00:54, 488.52it/s]","\rparsing log, completed traces ::  15%|#4        | 4725/31509 [00:09<00:49, 542.00it/s]","\rparsing log, completed traces ::  15%|#5        | 4796/31509 [00:09<00:45, 581.34it/s]","\rparsing log, completed traces ::  15%|#5        | 4865/31509 [00:09<00:43, 609.42it/s]","\rparsing log, completed traces ::  16%|#5        | 4933/31509 [00:09<00:42, 623.17it/s]","\rparsing log, completed traces ::  16%|#5        | 5001/31509 [00:09<00:41, 637.95it/s]","\rparsing log, completed traces ::  16%|#6        | 5076/31509 [00:09<00:39, 669.50it/s]","\rparsing log, completed traces ::  16%|#6        | 5147/31509 [00:09<00:38, 680.48it/s]","\rparsing log, completed traces ::  17%|#6        | 5217/31509 [00:09<00:38, 675.60it/s]","\rparsing log, completed traces ::  17%|#6        | 5288/31509 [00:09<00:38, 685.31it/s]","\rparsing log, completed traces ::  17%|#7        | 5358/31509 [00:10<00:38, 681.92it/s]","\rparsing log, completed traces ::  17%|#7        | 5427/31509 [00:10<00:38, 674.27it/s]","\rparsing log, completed traces ::  17%|#7        | 5501/31509 [00:10<00:37, 691.94it/s]","\rparsing log, completed traces ::  18%|#7        | 5575/31509 [00:10<00:36, 705.56it/s]","\rparsing log, completed traces ::  18%|#7        | 5647/31509 [00:10<00:36, 707.85it/s]","\rparsing log, completed traces ::  18%|#8        | 5723/31509 [00:10<00:35, 722.48it/s]","\rparsing log, completed traces ::  18%|#8        | 5796/31509 [00:10<00:35, 714.69it/s]","\rparsing log, completed traces ::  19%|#8        | 5871/31509 [00:10<00:35, 724.52it/s]","\rparsing log, completed traces ::  19%|#8        | 5950/31509 [00:10<00:34, 741.64it/s]","\rparsing log, completed traces ::  19%|#9        | 6025/31509 [00:10<00:35, 714.68it/s]","\rparsing log, completed traces ::  19%|#9        | 6097/31509 [00:11<00:35, 706.55it/s]","\rparsing log, completed traces ::  20%|#9        | 6170/31509 [00:11<00:35, 710.35it/s]","\rparsing log, completed traces ::  20%|#9        | 6242/31509 [00:11<00:35, 712.13it/s]","\rparsing log, completed traces ::  20%|##        | 6314/31509 [00:11<01:25, 295.23it/s]","\rparsing log, completed traces ::  20%|##        | 6389/31509 [00:11<01:09, 362.04it/s]","\rparsing log, completed traces ::  20%|##        | 6456/31509 [00:12<01:00, 414.00it/s]","\rparsing log, completed traces ::  21%|##        | 6524/31509 [00:12<00:53, 465.39it/s]","\rparsing log, completed traces ::  21%|##        | 6588/31509 [00:12<00:50, 494.52it/s]","\rparsing log, completed traces ::  21%|##1       | 6656/31509 [00:12<00:46, 537.27it/s]","\rparsing log, completed traces ::  21%|##1       | 6728/31509 [00:12<00:42, 583.01it/s]","\rparsing log, completed traces ::  22%|##1       | 6796/31509 [00:12<00:40, 607.01it/s]","\rparsing log, completed traces ::  22%|##1       | 6863/31509 [00:12<00:39, 618.11it/s]","\rparsing log, completed traces ::  22%|##2       | 6937/31509 [00:12<00:37, 651.12it/s]","\rparsing log, completed traces ::  22%|##2       | 7006/31509 [00:12<00:37, 656.30it/s]","\rparsing log, completed traces ::  22%|##2       | 7082/31509 [00:13<00:35, 681.47it/s]","\rparsing log, completed traces ::  23%|##2       | 7153/31509 [00:13<00:35, 686.90it/s]","\rparsing log, completed traces ::  23%|##2       | 7223/31509 [00:13<00:36, 666.45it/s]","\rparsing log, completed traces ::  23%|##3       | 7295/31509 [00:13<00:35, 679.57it/s]","\rparsing log, completed traces ::  23%|##3       | 7364/31509 [00:13<00:36, 670.42it/s]","\rparsing log, completed traces ::  24%|##3       | 7432/31509 [00:13<00:35, 672.78it/s]","\rparsing log, completed traces ::  24%|##3       | 7503/31509 [00:13<00:35, 682.51it/s]","\rparsing log, completed traces ::  24%|##4       | 7576/31509 [00:13<00:34, 695.07it/s]","\rparsing log, completed traces ::  24%|##4       | 7646/31509 [00:13<00:34, 682.84it/s]","\rparsing log, completed traces ::  24%|##4       | 7715/31509 [00:13<00:35, 676.95it/s]","\rparsing log, completed traces ::  25%|##4       | 7783/31509 [00:14<00:35, 663.50it/s]","\rparsing log, completed traces ::  25%|##4       | 7854/31509 [00:14<00:35, 675.52it/s]","\rparsing log, completed traces ::  25%|##5       | 7926/31509 [00:14<00:34, 687.91it/s]","\rparsing log, completed traces ::  25%|##5       | 7997/31509 [00:14<00:33, 693.62it/s]","\rparsing log, completed traces ::  26%|##5       | 8067/31509 [00:14<00:34, 687.68it/s]","\rparsing log, completed traces ::  26%|##5       | 8136/31509 [00:14<00:34, 683.31it/s]","\rparsing log, completed traces ::  26%|##6       | 8207/31509 [00:14<00:33, 688.90it/s]","\rparsing log, completed traces ::  26%|##6       | 8276/31509 [00:15<01:28, 263.74it/s]","\rparsing log, completed traces ::  26%|##6       | 8349/31509 [00:15<01:10, 327.73it/s]","\rparsing log, completed traces ::  27%|##6       | 8410/31509 [00:15<01:01, 374.32it/s]","\rparsing log, completed traces ::  27%|##6       | 8481/31509 [00:15<00:52, 438.02it/s]","\rparsing log, completed traces ::  27%|##7       | 8545/31509 [00:15<00:47, 479.58it/s]","\rparsing log, completed traces ::  27%|##7       | 8614/31509 [00:15<00:43, 528.07it/s]","\rparsing log, completed traces ::  28%|##7       | 8681/31509 [00:15<00:40, 560.76it/s]","\rparsing log, completed traces ::  28%|##7       | 8752/31509 [00:16<00:38, 598.85it/s]","\rparsing log, completed traces ::  28%|##7       | 8821/31509 [00:16<00:36, 615.02it/s]","\rparsing log, completed traces ::  28%|##8       | 8888/31509 [00:16<00:36, 626.47it/s]","\rparsing log, completed traces ::  28%|##8       | 8957/31509 [00:16<00:35, 643.23it/s]","\rparsing log, completed traces ::  29%|##8       | 9024/31509 [00:16<00:35, 628.72it/s]","\rparsing log, completed traces ::  29%|##8       | 9090/31509 [00:16<00:35, 637.42it/s]","\rparsing log, completed traces ::  29%|##9       | 9158/31509 [00:16<00:34, 645.61it/s]","\rparsing log, completed traces ::  29%|##9       | 9224/31509 [00:16<00:34, 637.73it/s]","\rparsing log, completed traces ::  29%|##9       | 9289/31509 [00:16<00:34, 635.16it/s]","\rparsing log, completed traces ::  30%|##9       | 9362/31509 [00:16<00:33, 661.55it/s]","\rparsing log, completed traces ::  30%|##9       | 9429/31509 [00:17<00:33, 649.77it/s]","\rparsing log, completed traces ::  30%|###       | 9495/31509 [00:17<00:34, 646.25it/s]","\rparsing log, completed traces ::  30%|###       | 9564/31509 [00:17<00:33, 656.61it/s]","\rparsing log, completed traces ::  31%|###       | 9632/31509 [00:17<00:33, 660.10it/s]","\rparsing log, completed traces ::  31%|###       | 9699/31509 [00:17<00:34, 637.09it/s]","\rparsing log, completed traces ::  31%|###       | 9764/31509 [00:17<00:34, 638.03it/s]","\rparsing log, completed traces ::  31%|###1      | 9829/31509 [00:17<00:33, 640.59it/s]","\rparsing log, completed traces ::  31%|###1      | 9894/31509 [00:17<00:34, 632.83it/s]","\rparsing log, completed traces ::  32%|###1      | 9959/31509 [00:17<00:33, 637.60it/s]","\rparsing log, completed traces ::  32%|###1      | 10023/31509 [00:17<00:33, 636.17it/s]","\rparsing log, completed traces ::  32%|###2      | 10087/31509 [00:18<00:34, 618.69it/s]","\rparsing log, completed traces ::  32%|###2      | 10150/31509 [00:18<00:34, 619.40it/s]","\rparsing log, completed traces ::  32%|###2      | 10219/31509 [00:18<00:33, 637.10it/s]","\rparsing log, completed traces ::  33%|###2      | 10285/31509 [00:18<00:33, 642.50it/s]","\rparsing log, completed traces ::  33%|###2      | 10350/31509 [00:19<01:28, 239.24it/s]","\rparsing log, completed traces ::  33%|###3      | 10414/31509 [00:19<01:11, 293.11it/s]","\rparsing log, completed traces ::  33%|###3      | 10478/31509 [00:19<01:00, 348.76it/s]","\rparsing log, completed traces ::  33%|###3      | 10539/31509 [00:19<00:52, 397.15it/s]","\rparsing log, completed traces ::  34%|###3      | 10605/31509 [00:19<00:46, 451.38it/s]","\rparsing log, completed traces ::  34%|###3      | 10669/31509 [00:19<00:42, 493.29it/s]","\rparsing log, completed traces ::  34%|###4      | 10732/31509 [00:19<00:39, 525.69it/s]","\rparsing log, completed traces ::  34%|###4      | 10794/31509 [00:19<00:38, 534.03it/s]","\rparsing log, completed traces ::  34%|###4      | 10854/31509 [00:19<00:38, 540.63it/s]","\rparsing log, completed traces ::  35%|###4      | 10918/31509 [00:19<00:36, 566.62it/s]","\rparsing log, completed traces ::  35%|###4      | 10980/31509 [00:20<00:35, 580.50it/s]","\rparsing log, completed traces ::  35%|###5      | 11045/31509 [00:20<00:34, 599.39it/s]","\rparsing log, completed traces ::  35%|###5      | 11112/31509 [00:20<00:33, 618.01it/s]","\rparsing log, completed traces ::  35%|###5      | 11177/31509 [00:20<00:32, 626.94it/s]","\rparsing log, completed traces ::  36%|###5      | 11245/31509 [00:20<00:31, 642.33it/s]","\rparsing log, completed traces ::  36%|###5      | 11310/31509 [00:20<00:31, 643.46it/s]","\rparsing log, completed traces ::  36%|###6      | 11375/31509 [00:20<00:31, 629.55it/s]","\rparsing log, completed traces ::  36%|###6      | 11440/31509 [00:20<00:31, 631.70it/s]","\rparsing log, completed traces ::  37%|###6      | 11504/31509 [00:20<00:31, 628.23it/s]","\rparsing log, completed traces ::  37%|###6      | 11569/31509 [00:21<00:31, 628.32it/s]","\rparsing log, completed traces ::  37%|###6      | 11635/31509 [00:21<00:31, 633.87it/s]","\rparsing log, completed traces ::  37%|###7      | 11699/31509 [00:21<00:31, 631.99it/s]","\rparsing log, completed traces ::  37%|###7      | 11767/31509 [00:21<00:30, 643.04it/s]","\rparsing log, completed traces ::  38%|###7      | 11836/31509 [00:21<00:30, 653.14it/s]","\rparsing log, completed traces ::  38%|###7      | 11908/31509 [00:21<00:29, 668.66it/s]","\rparsing log, completed traces ::  38%|###8      | 11979/31509 [00:21<00:28, 678.92it/s]","\rparsing log, completed traces ::  38%|###8      | 12047/31509 [00:21<00:28, 673.93it/s]","\rparsing log, completed traces ::  38%|###8      | 12115/31509 [00:21<00:29, 661.61it/s]","\rparsing log, completed traces ::  39%|###8      | 12182/31509 [00:21<00:29, 651.40it/s]","\rparsing log, completed traces ::  39%|###8      | 12254/31509 [00:22<00:28, 669.77it/s]","\rparsing log, completed traces ::  39%|###9      | 12322/31509 [00:22<00:28, 665.24it/s]","\rparsing log, completed traces ::  39%|###9      | 12389/31509 [00:22<00:28, 665.57it/s]","\rparsing log, completed traces ::  40%|###9      | 12457/31509 [00:22<00:28, 667.75it/s]","\rparsing log, completed traces ::  40%|###9      | 12524/31509 [00:22<00:28, 663.14it/s]","\rparsing log, completed traces ::  40%|###9      | 12591/31509 [00:22<00:28, 657.87it/s]","\rparsing log, completed traces ::  40%|####      | 12658/31509 [00:22<00:28, 656.72it/s]","\rparsing log, completed traces ::  40%|####      | 12724/31509 [00:23<01:23, 224.53it/s]","\rparsing log, completed traces ::  41%|####      | 12787/31509 [00:23<01:08, 275.03it/s]","\rparsing log, completed traces ::  41%|####      | 12850/31509 [00:23<00:56, 328.55it/s]","\rparsing log, completed traces ::  41%|####      | 12914/31509 [00:23<00:48, 383.96it/s]","\rparsing log, completed traces ::  41%|####1     | 12983/31509 [00:23<00:41, 445.96it/s]","\rparsing log, completed traces ::  41%|####1     | 13052/31509 [00:23<00:36, 499.40it/s]","\rparsing log, completed traces ::  42%|####1     | 13124/31509 [00:24<00:33, 552.75it/s]","\rparsing log, completed traces ::  42%|####1     | 13190/31509 [00:24<00:32, 569.42it/s]","\rparsing log, completed traces ::  42%|####2     | 13256/31509 [00:24<00:30, 591.39it/s]","\rparsing log, completed traces ::  42%|####2     | 13323/31509 [00:24<00:29, 612.38it/s]","\rparsing log, completed traces ::  42%|####2     | 13391/31509 [00:24<00:28, 631.03it/s]","\rparsing log, completed traces ::  43%|####2     | 13458/31509 [00:24<00:28, 627.72it/s]","\rparsing log, completed traces ::  43%|####2     | 13526/31509 [00:24<00:28, 640.44it/s]","\rparsing log, completed traces ::  43%|####3     | 13592/31509 [00:24<00:28, 634.47it/s]","\rparsing log, completed traces ::  43%|####3     | 13657/31509 [00:24<00:28, 631.79it/s]","\rparsing log, completed traces ::  44%|####3     | 13723/31509 [00:24<00:27, 638.04it/s]","\rparsing log, completed traces ::  44%|####3     | 13788/31509 [00:25<00:27, 639.85it/s]","\rparsing log, completed traces ::  44%|####3     | 13855/31509 [00:25<00:27, 645.19it/s]","\rparsing log, completed traces ::  44%|####4     | 13921/31509 [00:25<00:27, 648.39it/s]","\rparsing log, completed traces ::  44%|####4     | 13987/31509 [00:25<00:27, 643.74it/s]","\rparsing log, completed traces ::  45%|####4     | 14054/31509 [00:25<00:26, 648.63it/s]","\rparsing log, completed traces ::  45%|####4     | 14121/31509 [00:25<00:26, 652.34it/s]","\rparsing log, completed traces ::  45%|####5     | 14190/31509 [00:25<00:26, 660.23it/s]","\rparsing log, completed traces ::  45%|####5     | 14257/31509 [00:25<00:26, 662.80it/s]","\rparsing log, completed traces ::  45%|####5     | 14325/31509 [00:25<00:25, 667.64it/s]","\rparsing log, completed traces ::  46%|####5     | 14399/31509 [00:25<00:24, 687.15it/s]","\rparsing log, completed traces ::  46%|####5     | 14468/31509 [00:26<00:24, 685.59it/s]","\rparsing log, completed traces ::  46%|####6     | 14537/31509 [00:26<00:25, 661.12it/s]","\rparsing log, completed traces ::  46%|####6     | 14604/31509 [00:26<00:25, 653.98it/s]","\rparsing log, completed traces ::  47%|####6     | 14671/31509 [00:26<00:25, 657.34it/s]","\rparsing log, completed traces ::  47%|####6     | 14740/31509 [00:26<00:25, 665.34it/s]","\rparsing log, completed traces ::  47%|####7     | 14812/31509 [00:26<00:24, 680.74it/s]","\rparsing log, completed traces ::  47%|####7     | 14881/31509 [00:26<00:24, 670.88it/s]","\rparsing log, completed traces ::  47%|####7     | 14956/31509 [00:26<00:23, 694.03it/s]","\rparsing log, completed traces ::  48%|####7     | 15026/31509 [00:26<00:24, 673.48it/s]","\rparsing log, completed traces ::  48%|####7     | 15101/31509 [00:26<00:23, 692.24it/s]","\rparsing log, completed traces ::  48%|####8     | 15171/31509 [00:27<00:23, 692.59it/s]","\rparsing log, completed traces ::  48%|####8     | 15241/31509 [00:27<00:23, 686.87it/s]","\rparsing log, completed traces ::  49%|####8     | 15313/31509 [00:27<00:23, 695.24it/s]","\rparsing log, completed traces ::  49%|####8     | 15385/31509 [00:27<00:22, 701.80it/s]","\rparsing log, completed traces ::  49%|####9     | 15456/31509 [00:28<01:10, 228.49it/s]","\rparsing log, completed traces ::  49%|####9     | 15526/31509 [00:28<00:56, 284.96it/s]","\rparsing log, completed traces ::  50%|####9     | 15597/31509 [00:28<00:45, 347.17it/s]","\rparsing log, completed traces ::  50%|####9     | 15673/31509 [00:28<00:37, 418.15it/s]","\rparsing log, completed traces ::  50%|####9     | 15739/31509 [00:28<00:33, 464.88it/s]","\rparsing log, completed traces ::  50%|#####     | 15808/31509 [00:28<00:30, 514.13it/s]","\rparsing log, completed traces ::  50%|#####     | 15880/31509 [00:28<00:27, 563.08it/s]","\rparsing log, completed traces ::  51%|#####     | 15949/31509 [00:28<00:26, 592.61it/s]","\rparsing log, completed traces ::  51%|#####     | 16017/31509 [00:29<00:25, 615.41it/s]","\rparsing log, completed traces ::  51%|#####1    | 16091/31509 [00:29<00:23, 647.19it/s]","\rparsing log, completed traces ::  51%|#####1    | 16168/31509 [00:29<00:22, 680.33it/s]","\rparsing log, completed traces ::  52%|#####1    | 16240/31509 [00:29<00:22, 688.49it/s]","\rparsing log, completed traces ::  52%|#####1    | 16314/31509 [00:29<00:21, 701.18it/s]","\rparsing log, completed traces ::  52%|#####2    | 16386/31509 [00:29<00:22, 675.29it/s]","\rparsing log, completed traces ::  52%|#####2    | 16455/31509 [00:29<00:22, 669.88it/s]","\rparsing log, completed traces ::  52%|#####2    | 16523/31509 [00:29<00:23, 649.08it/s]","\rparsing log, completed traces ::  53%|#####2    | 16593/31509 [00:29<00:22, 663.22it/s]","\rparsing log, completed traces ::  53%|#####2    | 16665/31509 [00:29<00:21, 678.89it/s]","\rparsing log, completed traces ::  53%|#####3    | 16734/31509 [00:30<00:21, 672.50it/s]","\rparsing log, completed traces ::  53%|#####3    | 16802/31509 [00:30<00:21, 668.72it/s]","\rparsing log, completed traces ::  54%|#####3    | 16875/31509 [00:30<00:21, 684.71it/s]","\rparsing log, completed traces ::  54%|#####3    | 16944/31509 [00:30<00:21, 683.39it/s]","\rparsing log, completed traces ::  54%|#####3    | 17013/31509 [00:30<00:21, 681.32it/s]","\rparsing log, completed traces ::  54%|#####4    | 17087/31509 [00:30<00:20, 695.42it/s]","\rparsing log, completed traces ::  54%|#####4    | 17157/31509 [00:30<00:20, 686.94it/s]","\rparsing log, completed traces ::  55%|#####4    | 17226/31509 [00:30<00:21, 668.23it/s]","\rparsing log, completed traces ::  55%|#####4    | 17298/31509 [00:30<00:20, 681.38it/s]","\rparsing log, completed traces ::  55%|#####5    | 17367/31509 [00:30<00:21, 672.27it/s]","\rparsing log, completed traces ::  55%|#####5    | 17443/31509 [00:31<00:20, 696.94it/s]","\rparsing log, completed traces ::  56%|#####5    | 17513/31509 [00:31<00:21, 662.18it/s]","\rparsing log, completed traces ::  56%|#####5    | 17586/31509 [00:31<00:20, 680.44it/s]","\rparsing log, completed traces ::  56%|#####6    | 17660/31509 [00:31<00:19, 697.17it/s]","\rparsing log, completed traces ::  56%|#####6    | 17731/31509 [00:31<00:19, 689.84it/s]","\rparsing log, completed traces ::  57%|#####6    | 17803/31509 [00:31<00:19, 693.49it/s]","\rparsing log, completed traces ::  57%|#####6    | 17875/31509 [00:31<00:19, 700.64it/s]","\rparsing log, completed traces ::  57%|#####6    | 17946/31509 [00:31<00:19, 694.36it/s]","\rparsing log, completed traces ::  57%|#####7    | 18017/31509 [00:31<00:19, 697.78it/s]","\rparsing log, completed traces ::  57%|#####7    | 18089/31509 [00:32<00:19, 702.79it/s]","\rparsing log, completed traces ::  58%|#####7    | 18160/31509 [00:32<00:18, 704.09it/s]","\rparsing log, completed traces ::  58%|#####7    | 18231/31509 [00:32<00:19, 689.38it/s]","\rparsing log, completed traces ::  58%|#####8    | 18301/31509 [00:32<00:19, 689.90it/s]","\rparsing log, completed traces ::  58%|#####8    | 18371/31509 [00:32<00:19, 678.53it/s]","\rparsing log, completed traces ::  59%|#####8    | 18441/31509 [00:32<00:19, 684.73it/s]","\rparsing log, completed traces ::  59%|#####8    | 18510/31509 [00:32<00:18, 685.95it/s]","\rparsing log, completed traces ::  59%|#####8    | 18579/31509 [00:32<00:19, 662.67it/s]","\rparsing log, completed traces ::  59%|#####9    | 18652/31509 [00:32<00:18, 681.70it/s]","\rparsing log, completed traces ::  59%|#####9    | 18721/31509 [00:33<01:01, 206.40it/s]","\rparsing log, completed traces ::  60%|#####9    | 18789/31509 [00:33<00:49, 259.34it/s]","\rparsing log, completed traces ::  60%|#####9    | 18858/31509 [00:33<00:39, 318.45it/s]","\rparsing log, completed traces ::  60%|######    | 18938/31509 [00:34<00:31, 397.46it/s]","\rparsing log, completed traces ::  60%|######    | 19007/31509 [00:34<00:27, 452.57it/s]","\rparsing log, completed traces ::  61%|######    | 19078/31509 [00:34<00:24, 506.89it/s]","\rparsing log, completed traces ::  61%|######    | 19153/31509 [00:34<00:21, 562.25it/s]","\rparsing log, completed traces ::  61%|######1   | 19223/31509 [00:34<00:21, 583.66it/s]","\rparsing log, completed traces ::  61%|######1   | 19295/31509 [00:34<00:19, 617.97it/s]","\rparsing log, completed traces ::  61%|######1   | 19369/31509 [00:34<00:18, 647.62it/s]","\rparsing log, completed traces ::  62%|######1   | 19444/31509 [00:34<00:17, 674.72it/s]","\rparsing log, completed traces ::  62%|######1   | 19516/31509 [00:34<00:17, 681.20it/s]","\rparsing log, completed traces ::  62%|######2   | 19590/31509 [00:34<00:17, 693.99it/s]","\rparsing log, completed traces ::  62%|######2   | 19662/31509 [00:35<00:17, 694.66it/s]","\rparsing log, completed traces ::  63%|######2   | 19733/31509 [00:35<00:17, 692.70it/s]","\rparsing log, completed traces ::  63%|######2   | 19804/31509 [00:35<00:17, 678.01it/s]","\rparsing log, completed traces ::  63%|######3   | 19873/31509 [00:35<00:17, 679.08it/s]","\rparsing log, completed traces ::  63%|######3   | 19942/31509 [00:35<00:17, 679.76it/s]","\rparsing log, completed traces ::  64%|######3   | 20011/31509 [00:35<00:17, 671.33it/s]","\rparsing log, completed traces ::  64%|######3   | 20080/31509 [00:35<00:16, 676.38it/s]","\rparsing log, completed traces ::  64%|######3   | 20150/31509 [00:35<00:16, 679.81it/s]","\rparsing log, completed traces ::  64%|######4   | 20224/31509 [00:35<00:16, 693.85it/s]","\rparsing log, completed traces ::  64%|######4   | 20298/31509 [00:35<00:15, 703.16it/s]","\rparsing log, completed traces ::  65%|######4   | 20369/31509 [00:36<00:16, 686.04it/s]","\rparsing log, completed traces ::  65%|######4   | 20451/31509 [00:36<00:15, 723.32it/s]","\rparsing log, completed traces ::  65%|######5   | 20524/31509 [00:36<00:15, 717.70it/s]","\rparsing log, completed traces ::  65%|######5   | 20598/31509 [00:36<00:15, 723.86it/s]","\rparsing log, completed traces ::  66%|######5   | 20673/31509 [00:36<00:14, 728.02it/s]","\rparsing log, completed traces ::  66%|######5   | 20747/31509 [00:36<00:14, 727.88it/s]","\rparsing log, completed traces ::  66%|######6   | 20820/31509 [00:36<00:14, 723.42it/s]","\rparsing log, completed traces ::  66%|######6   | 20893/31509 [00:36<00:14, 711.81it/s]","\rparsing log, completed traces ::  67%|######6   | 20965/31509 [00:36<00:15, 696.26it/s]","\rparsing log, completed traces ::  67%|######6   | 21035/31509 [00:37<00:15, 688.19it/s]","\rparsing log, completed traces ::  67%|######6   | 21104/31509 [00:37<00:15, 684.93it/s]","\rparsing log, completed traces ::  67%|######7   | 21173/31509 [00:37<00:15, 680.68it/s]","\rparsing log, completed traces ::  67%|######7   | 21248/31509 [00:37<00:14, 699.05it/s]","\rparsing log, completed traces ::  68%|######7   | 21320/31509 [00:37<00:14, 704.53it/s]","\rparsing log, completed traces ::  68%|######7   | 21391/31509 [00:37<00:14, 692.82it/s]","\rparsing log, completed traces ::  68%|######8   | 21469/31509 [00:37<00:13, 718.23it/s]","\rparsing log, completed traces ::  68%|######8   | 21544/31509 [00:37<00:13, 726.46it/s]","\rparsing log, completed traces ::  69%|######8   | 21617/31509 [00:37<00:13, 715.56it/s]","\rparsing log, completed traces ::  69%|######8   | 21689/31509 [00:37<00:14, 696.88it/s]","\rparsing log, completed traces ::  69%|######9   | 21768/31509 [00:38<00:13, 723.44it/s]","\rparsing log, completed traces ::  69%|######9   | 21843/31509 [00:38<00:13, 729.01it/s]","\rparsing log, completed traces ::  70%|######9   | 21920/31509 [00:38<00:12, 739.90it/s]","\rparsing log, completed traces ::  70%|######9   | 21995/31509 [00:38<00:12, 732.23it/s]","\rparsing log, completed traces ::  70%|#######   | 22071/31509 [00:38<00:12, 738.23it/s]","\rparsing log, completed traces ::  70%|#######   | 22145/31509 [00:38<00:12, 738.27it/s]","\rparsing log, completed traces ::  71%|#######   | 22219/31509 [00:38<00:12, 730.71it/s]","\rparsing log, completed traces ::  71%|#######   | 22293/31509 [00:38<00:12, 733.21it/s]","\rparsing log, completed traces ::  71%|#######   | 22367/31509 [00:38<00:12, 716.71it/s]","\rparsing log, completed traces ::  71%|#######1  | 22439/31509 [00:39<00:46, 196.17it/s]","\rparsing log, completed traces ::  71%|#######1  | 22514/31509 [00:39<00:35, 252.39it/s]","\rparsing log, completed traces ::  72%|#######1  | 22586/31509 [00:40<00:28, 311.61it/s]","\rparsing log, completed traces ::  72%|#######1  | 22657/31509 [00:40<00:23, 372.43it/s]","\rparsing log, completed traces ::  72%|#######2  | 22730/31509 [00:40<00:20, 435.88it/s]","\rparsing log, completed traces ::  72%|#######2  | 22806/31509 [00:40<00:17, 499.44it/s]","\rparsing log, completed traces ::  73%|#######2  | 22879/31509 [00:40<00:15, 549.72it/s]","\rparsing log, completed traces ::  73%|#######2  | 22950/31509 [00:40<00:14, 576.99it/s]","\rparsing log, completed traces ::  73%|#######3  | 23020/31509 [00:40<00:13, 606.52it/s]","\rparsing log, completed traces ::  73%|#######3  | 23089/31509 [00:40<00:13, 626.28it/s]","\rparsing log, completed traces ::  73%|#######3  | 23158/31509 [00:40<00:13, 637.20it/s]","\rparsing log, completed traces ::  74%|#######3  | 23228/31509 [00:41<00:12, 652.53it/s]","\rparsing log, completed traces ::  74%|#######3  | 23297/31509 [00:41<00:12, 659.18it/s]","\rparsing log, completed traces ::  74%|#######4  | 23366/31509 [00:41<00:12, 659.96it/s]","\rparsing log, completed traces ::  74%|#######4  | 23436/31509 [00:41<00:12, 671.36it/s]","\rparsing log, completed traces ::  75%|#######4  | 23505/31509 [00:41<00:11, 673.46it/s]","\rparsing log, completed traces ::  75%|#######4  | 23579/31509 [00:41<00:11, 692.59it/s]","\rparsing log, completed traces ::  75%|#######5  | 23650/31509 [00:41<00:11, 695.44it/s]","\rparsing log, completed traces ::  75%|#######5  | 23721/31509 [00:41<00:11, 696.97it/s]","\rparsing log, completed traces ::  76%|#######5  | 23792/31509 [00:41<00:11, 700.10it/s]","\rparsing log, completed traces ::  76%|#######5  | 23863/31509 [00:41<00:10, 698.49it/s]","\rparsing log, completed traces ::  76%|#######5  | 23933/31509 [00:42<00:10, 694.48it/s]","\rparsing log, completed traces ::  76%|#######6  | 24003/31509 [00:42<00:10, 694.78it/s]","\rparsing log, completed traces ::  76%|#######6  | 24074/31509 [00:42<00:10, 695.87it/s]","\rparsing log, completed traces ::  77%|#######6  | 24144/31509 [00:42<00:10, 697.04it/s]","\rparsing log, completed traces ::  77%|#######6  | 24215/31509 [00:42<00:10, 699.40it/s]","\rparsing log, completed traces ::  77%|#######7  | 24285/31509 [00:42<00:10, 696.93it/s]","\rparsing log, completed traces ::  77%|#######7  | 24359/31509 [00:42<00:10, 706.21it/s]","\rparsing log, completed traces ::  78%|#######7  | 24430/31509 [00:42<00:10, 683.29it/s]","\rparsing log, completed traces ::  78%|#######7  | 24505/31509 [00:42<00:09, 702.46it/s]","\rparsing log, completed traces ::  78%|#######7  | 24577/31509 [00:42<00:09, 705.95it/s]","\rparsing log, completed traces ::  78%|#######8  | 24653/31509 [00:43<00:09, 720.67it/s]","\rparsing log, completed traces ::  78%|#######8  | 24726/31509 [00:43<00:09, 717.78it/s]","\rparsing log, completed traces ::  79%|#######8  | 24798/31509 [00:43<00:09, 713.52it/s]","\rparsing log, completed traces ::  79%|#######8  | 24874/31509 [00:43<00:09, 724.93it/s]","\rparsing log, completed traces ::  79%|#######9  | 24947/31509 [00:43<00:09, 717.88it/s]","\rparsing log, completed traces ::  79%|#######9  | 25025/31509 [00:43<00:08, 734.79it/s]","\rparsing log, completed traces ::  80%|#######9  | 25099/31509 [00:43<00:09, 691.92it/s]","\rparsing log, completed traces ::  80%|#######9  | 25175/31509 [00:43<00:08, 710.25it/s]","\rparsing log, completed traces ::  80%|########  | 25247/31509 [00:43<00:08, 700.15it/s]","\rparsing log, completed traces ::  80%|########  | 25318/31509 [00:44<00:09, 678.34it/s]","\rparsing log, completed traces ::  81%|########  | 25395/31509 [00:44<00:08, 703.55it/s]","\rparsing log, completed traces ::  81%|########  | 25466/31509 [00:44<00:08, 700.32it/s]","\rparsing log, completed traces ::  81%|########1 | 25537/31509 [00:44<00:08, 701.36it/s]","\rparsing log, completed traces ::  81%|########1 | 25610/31509 [00:44<00:08, 706.37it/s]","\rparsing log, completed traces ::  82%|########1 | 25681/31509 [00:44<00:08, 696.28it/s]","\rparsing log, completed traces ::  82%|########1 | 25751/31509 [00:44<00:08, 696.61it/s]","\rparsing log, completed traces ::  82%|########1 | 25821/31509 [00:44<00:08, 677.84it/s]","\rparsing log, completed traces ::  82%|########2 | 25891/31509 [00:44<00:08, 680.20it/s]","\rparsing log, completed traces ::  82%|########2 | 25960/31509 [00:44<00:08, 681.89it/s]","\rparsing log, completed traces ::  83%|########2 | 26029/31509 [00:45<00:08, 672.95it/s]","\rparsing log, completed traces ::  83%|########2 | 26097/31509 [00:45<00:08, 667.31it/s]","\rparsing log, completed traces ::  83%|########3 | 26169/31509 [00:45<00:07, 680.49it/s]","\rparsing log, completed traces ::  83%|########3 | 26239/31509 [00:45<00:07, 685.06it/s]","\rparsing log, completed traces ::  83%|########3 | 26310/31509 [00:45<00:07, 692.08it/s]","\rparsing log, completed traces ::  84%|########3 | 26383/31509 [00:45<00:07, 699.46it/s]","\rparsing log, completed traces ::  84%|########3 | 26453/31509 [00:45<00:07, 692.85it/s]","\rparsing log, completed traces ::  84%|########4 | 26523/31509 [00:46<00:28, 172.11it/s]","\rparsing log, completed traces ::  84%|########4 | 26587/31509 [00:46<00:22, 216.28it/s]","\rparsing log, completed traces ::  85%|########4 | 26653/31509 [00:46<00:18, 269.02it/s]","\rparsing log, completed traces ::  85%|########4 | 26726/31509 [00:47<00:14, 335.56it/s]","\rparsing log, completed traces ::  85%|########5 | 26794/31509 [00:47<00:12, 392.52it/s]","\rparsing log, completed traces ::  85%|########5 | 26863/31509 [00:47<00:10, 449.19it/s]","\rparsing log, completed traces ::  85%|########5 | 26931/31509 [00:47<00:09, 498.84it/s]","\rparsing log, completed traces ::  86%|########5 | 26999/31509 [00:47<00:08, 538.81it/s]","\rparsing log, completed traces ::  86%|########5 | 27065/31509 [00:47<00:07, 561.63it/s]","\rparsing log, completed traces ::  86%|########6 | 27137/31509 [00:47<00:07, 601.87it/s]","\rparsing log, completed traces ::  86%|########6 | 27209/31509 [00:47<00:06, 629.64it/s]","\rparsing log, completed traces ::  87%|########6 | 27283/31509 [00:47<00:06, 658.67it/s]","\rparsing log, completed traces ::  87%|########6 | 27353/31509 [00:48<00:06, 647.22it/s]","\rparsing log, completed traces ::  87%|########7 | 27424/31509 [00:48<00:06, 663.26it/s]","\rparsing log, completed traces ::  87%|########7 | 27493/31509 [00:48<00:06, 667.03it/s]","\rparsing log, completed traces ::  87%|########7 | 27565/31509 [00:48<00:05, 680.69it/s]","\rparsing log, completed traces ::  88%|########7 | 27635/31509 [00:48<00:05, 685.48it/s]","\rparsing log, completed traces ::  88%|########7 | 27709/31509 [00:48<00:05, 701.21it/s]","\rparsing log, completed traces ::  88%|########8 | 27784/31509 [00:48<00:05, 713.47it/s]","\rparsing log, completed traces ::  88%|########8 | 27856/31509 [00:48<00:05, 692.56it/s]","\rparsing log, completed traces ::  89%|########8 | 27926/31509 [00:48<00:05, 681.65it/s]","\rparsing log, completed traces ::  89%|########8 | 27995/31509 [00:48<00:05, 680.48it/s]","\rparsing log, completed traces ::  89%|########9 | 28064/31509 [00:49<00:05, 679.62it/s]","\rparsing log, completed traces ::  89%|########9 | 28133/31509 [00:49<00:05, 672.58it/s]","\rparsing log, completed traces ::  90%|########9 | 28201/31509 [00:49<00:04, 673.42it/s]","\rparsing log, completed traces ::  90%|########9 | 28275/31509 [00:49<00:04, 689.01it/s]","\rparsing log, completed traces ::  90%|########9 | 28344/31509 [00:49<00:04, 682.98it/s]","\rparsing log, completed traces ::  90%|######### | 28413/31509 [00:49<00:04, 679.61it/s]","\rparsing log, completed traces ::  90%|######### | 28484/31509 [00:49<00:04, 685.18it/s]","\rparsing log, completed traces ::  91%|######### | 28553/31509 [00:49<00:04, 685.01it/s]","\rparsing log, completed traces ::  91%|######### | 28627/31509 [00:49<00:04, 699.80it/s]","\rparsing log, completed traces ::  91%|#########1| 28698/31509 [00:49<00:04, 681.58it/s]","\rparsing log, completed traces ::  91%|#########1| 28767/31509 [00:50<00:04, 656.25it/s]","\rparsing log, completed traces ::  92%|#########1| 28833/31509 [00:50<00:04, 646.35it/s]","\rparsing log, completed traces ::  92%|#########1| 28898/31509 [00:50<00:04, 637.31it/s]","\rparsing log, completed traces ::  92%|#########1| 28969/31509 [00:50<00:03, 657.05it/s]","\rparsing log, completed traces ::  92%|#########2| 29037/31509 [00:50<00:03, 659.90it/s]","\rparsing log, completed traces ::  92%|#########2| 29104/31509 [00:50<00:03, 650.53it/s]","\rparsing log, completed traces ::  93%|#########2| 29174/31509 [00:50<00:03, 662.84it/s]","\rparsing log, completed traces ::  93%|#########2| 29244/31509 [00:50<00:03, 668.59it/s]","\rparsing log, completed traces ::  93%|#########3| 29312/31509 [00:50<00:03, 669.89it/s]","\rparsing log, completed traces ::  93%|#########3| 29380/31509 [00:51<00:03, 661.95it/s]","\rparsing log, completed traces ::  93%|#########3| 29447/31509 [00:51<00:03, 649.62it/s]","\rparsing log, completed traces ::  94%|#########3| 29513/31509 [00:51<00:03, 630.45it/s]","\rparsing log, completed traces ::  94%|#########3| 29578/31509 [00:51<00:03, 633.89it/s]","\rparsing log, completed traces ::  94%|#########4| 29651/31509 [00:51<00:02, 660.24it/s]","\rparsing log, completed traces ::  94%|#########4| 29723/31509 [00:51<00:02, 677.55it/s]","\rparsing log, completed traces ::  95%|#########4| 29791/31509 [00:51<00:02, 657.03it/s]","\rparsing log, completed traces ::  95%|#########4| 29858/31509 [00:51<00:02, 659.60it/s]","\rparsing log, completed traces ::  95%|#########4| 29926/31509 [00:51<00:02, 665.36it/s]","\rparsing log, completed traces ::  95%|#########5| 29996/31509 [00:51<00:02, 674.81it/s]","\rparsing log, completed traces ::  95%|#########5| 30064/31509 [00:52<00:02, 659.43it/s]","\rparsing log, completed traces ::  96%|#########5| 30138/31509 [00:52<00:02, 681.84it/s]","\rparsing log, completed traces ::  96%|#########5| 30207/31509 [00:52<00:01, 682.34it/s]","\rparsing log, completed traces ::  96%|#########6| 30279/31509 [00:52<00:01, 689.40it/s]","\rparsing log, completed traces ::  96%|#########6| 30350/31509 [00:52<00:01, 695.16it/s]","\rparsing log, completed traces ::  97%|#########6| 30421/31509 [00:52<00:01, 699.08it/s]","\rparsing log, completed traces ::  97%|#########6| 30491/31509 [00:52<00:01, 693.17it/s]","\rparsing log, completed traces ::  97%|#########6| 30562/31509 [00:52<00:01, 697.46it/s]","\rparsing log, completed traces ::  97%|#########7| 30634/31509 [00:52<00:01, 702.60it/s]","\rparsing log, completed traces ::  97%|#########7| 30705/31509 [00:52<00:01, 701.00it/s]","\rparsing log, completed traces ::  98%|#########7| 30776/31509 [00:53<00:01, 696.86it/s]","\rparsing log, completed traces ::  98%|#########7| 30847/31509 [00:53<00:00, 699.02it/s]","\rparsing log, completed traces ::  98%|#########8| 30917/31509 [00:54<00:03, 159.32it/s]","\rparsing log, completed traces ::  98%|#########8| 30985/31509 [00:54<00:02, 205.03it/s]","\rparsing log, completed traces ::  99%|#########8| 31058/31509 [00:54<00:01, 263.13it/s]","\rparsing log, completed traces ::  99%|#########8| 31129/31509 [00:54<00:01, 323.44it/s]","\rparsing log, completed traces ::  99%|#########9| 31205/31509 [00:54<00:00, 394.55it/s]","\rparsing log, completed traces ::  99%|#########9| 31272/31509 [00:54<00:00, 439.78it/s]","\rparsing log, completed traces ::  99%|#########9| 31338/31509 [00:55<00:00, 481.20it/s]","\rparsing log, completed traces :: 100%|#########9| 31405/31509 [00:55<00:00, 523.53it/s]","\rparsing log, completed traces :: 100%|#########9| 31475/31509 [00:55<00:00, 565.65it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:55<00:00, 570.05it/s]","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   1%|          | 780/150370 [00:00<00:19, 7793.24it/s]","\rparsing log, completed traces ::   1%|1         | 1619/150370 [00:00<00:18, 8142.98it/s]","\rparsing log, completed traces ::   2%|1         | 2440/150370 [00:00<00:18, 8171.14it/s]","\rparsing log, completed traces ::   2%|2         | 3258/150370 [00:00<00:18, 8168.82it/s]","\rparsing log, completed traces ::   3%|2         | 4089/150370 [00:00<00:17, 8218.08it/s]","\rparsing log, completed traces ::   3%|3         | 4924/150370 [00:00<00:17, 8262.00it/s]","\rparsing log, completed traces ::   4%|3         | 5751/150370 [00:00<00:17, 8231.37it/s]","\rparsing log, completed traces ::   4%|4         | 6575/150370 [00:01<00:34, 4173.47it/s]","\rparsing log, completed traces ::   5%|4         | 7361/150370 [00:01<00:29, 4861.86it/s]","\rparsing log, completed traces ::   5%|5         | 8213/150370 [00:01<00:25, 5626.04it/s]","\rparsing log, completed traces ::   6%|6         | 9104/150370 [00:01<00:22, 6370.30it/s]","\rparsing log, completed traces ::   7%|6         | 9955/150370 [00:01<00:20, 6882.89it/s]","\rparsing log, completed traces ::   7%|7         | 10801/150370 [00:01<00:19, 7294.16it/s]","\rparsing log, completed traces ::   8%|7         | 11635/150370 [00:01<00:18, 7576.35it/s]","\rparsing log, completed traces ::   8%|8         | 12453/150370 [00:01<00:17, 7740.86it/s]","\rparsing log, completed traces ::   9%|8         | 13285/150370 [00:01<00:17, 7883.09it/s]","\rparsing log, completed traces ::   9%|9         | 14105/150370 [00:02<00:17, 7955.48it/s]","\rparsing log, completed traces ::  10%|9         | 14937/150370 [00:02<00:16, 8061.67it/s]","\rparsing log, completed traces ::  11%|#         | 15794/150370 [00:02<00:16, 8208.47it/s]","\rparsing log, completed traces ::  11%|#1        | 16667/150370 [00:02<00:15, 8359.85it/s]","\rparsing log, completed traces ::  12%|#1        | 17537/150370 [00:02<00:15, 8459.84it/s]","\rparsing log, completed traces ::  12%|#2        | 18389/150370 [00:02<00:15, 8467.18it/s]","\rparsing log, completed traces ::  13%|#2        | 19240/150370 [00:02<00:32, 4037.18it/s]","\rparsing log, completed traces ::  13%|#3        | 20081/150370 [00:03<00:27, 4774.52it/s]","\rparsing log, completed traces ::  14%|#3        | 20933/150370 [00:03<00:23, 5500.88it/s]","\rparsing log, completed traces ::  15%|#4        | 21864/150370 [00:03<00:20, 6326.81it/s]","\rparsing log, completed traces ::  15%|#5        | 22771/150370 [00:03<00:18, 6967.41it/s]","\rparsing log, completed traces ::  16%|#5        | 23619/150370 [00:03<00:17, 7348.70it/s]","\rparsing log, completed traces ::  16%|#6        | 24457/150370 [00:03<00:17, 7210.60it/s]","\rparsing log, completed traces ::  17%|#6        | 25251/150370 [00:03<00:17, 7163.85it/s]","\rparsing log, completed traces ::  17%|#7        | 26018/150370 [00:03<00:17, 7055.62it/s]","\rparsing log, completed traces ::  18%|#7        | 26759/150370 [00:03<00:17, 6906.22it/s]","\rparsing log, completed traces ::  18%|#8        | 27474/150370 [00:04<00:17, 6840.31it/s]","\rparsing log, completed traces ::  19%|#8        | 28175/150370 [00:04<00:17, 6881.29it/s]","\rparsing log, completed traces ::  19%|#9        | 28970/150370 [00:04<00:16, 7180.14it/s]","\rparsing log, completed traces ::  20%|#9        | 29779/150370 [00:04<00:16, 7440.47it/s]","\rparsing log, completed traces ::  20%|##        | 30532/150370 [00:04<00:16, 7296.85it/s]","\rparsing log, completed traces ::  21%|##        | 31268/150370 [00:04<00:16, 7171.44it/s]","\rparsing log, completed traces ::  21%|##1       | 31990/150370 [00:04<00:16, 7114.59it/s]","\rparsing log, completed traces ::  22%|##1       | 32705/150370 [00:05<00:36, 3245.47it/s]","\rparsing log, completed traces ::  22%|##2       | 33415/150370 [00:05<00:30, 3851.59it/s]","\rparsing log, completed traces ::  23%|##2       | 34152/150370 [00:05<00:25, 4499.27it/s]","\rparsing log, completed traces ::  23%|##3       | 34850/150370 [00:05<00:23, 5016.25it/s]","\rparsing log, completed traces ::  24%|##3       | 35554/150370 [00:05<00:20, 5480.34it/s]","\rparsing log, completed traces ::  24%|##4       | 36265/150370 [00:05<00:19, 5882.60it/s]","\rparsing log, completed traces ::  25%|##4       | 37000/150370 [00:05<00:18, 6248.74it/s]","\rparsing log, completed traces ::  25%|##5       | 37723/150370 [00:05<00:17, 6505.72it/s]","\rparsing log, completed traces ::  26%|##5       | 38480/150370 [00:05<00:16, 6801.91it/s]","\rparsing log, completed traces ::  26%|##6       | 39242/150370 [00:06<00:15, 7013.92it/s]","\rparsing log, completed traces ::  27%|##6       | 40006/150370 [00:06<00:15, 7194.19it/s]","\rparsing log, completed traces ::  27%|##7       | 40752/150370 [00:06<00:15, 7265.95it/s]","\rparsing log, completed traces ::  28%|##7       | 41543/150370 [00:06<00:14, 7453.90it/s]","\rparsing log, completed traces ::  28%|##8       | 42334/150370 [00:06<00:14, 7588.42it/s]","\rparsing log, completed traces ::  29%|##8       | 43112/150370 [00:06<00:14, 7645.12it/s]","\rparsing log, completed traces ::  29%|##9       | 43882/150370 [00:06<00:13, 7640.82it/s]","\rparsing log, completed traces ::  30%|##9       | 44651/150370 [00:06<00:13, 7629.66it/s]","\rparsing log, completed traces ::  30%|###       | 45417/150370 [00:06<00:13, 7615.24it/s]","\rparsing log, completed traces ::  31%|###       | 46181/150370 [00:06<00:13, 7563.59it/s]","\rparsing log, completed traces ::  31%|###1      | 46939/150370 [00:07<00:13, 7515.73it/s]","\rparsing log, completed traces ::  32%|###1      | 47692/150370 [00:07<00:32, 3128.47it/s]","\rparsing log, completed traces ::  32%|###2      | 48499/150370 [00:07<00:26, 3868.27it/s]","\rparsing log, completed traces ::  33%|###2      | 49365/150370 [00:07<00:21, 4712.35it/s]","\rparsing log, completed traces ::  33%|###3      | 50153/150370 [00:07<00:18, 5348.73it/s]","\rparsing log, completed traces ::  34%|###3      | 50906/150370 [00:08<00:17, 5827.43it/s]","\rparsing log, completed traces ::  34%|###4      | 51682/150370 [00:08<00:15, 6293.52it/s]","\rparsing log, completed traces ::  35%|###4      | 52441/150370 [00:08<00:14, 6625.03it/s]","\rparsing log, completed traces ::  35%|###5      | 53221/150370 [00:08<00:13, 6939.72it/s]","\rparsing log, completed traces ::  36%|###5      | 53989/150370 [00:08<00:13, 7143.96it/s]","\rparsing log, completed traces ::  36%|###6      | 54838/150370 [00:08<00:12, 7524.56it/s]","\rparsing log, completed traces ::  37%|###6      | 55627/150370 [00:08<00:12, 7587.86it/s]","\rparsing log, completed traces ::  38%|###7      | 56452/150370 [00:08<00:12, 7780.05it/s]","\rparsing log, completed traces ::  38%|###8      | 57283/150370 [00:08<00:11, 7934.71it/s]","\rparsing log, completed traces ::  39%|###8      | 58090/150370 [00:08<00:11, 7935.54it/s]","\rparsing log, completed traces ::  39%|###9      | 58893/150370 [00:09<00:11, 7900.42it/s]","\rparsing log, completed traces ::  40%|###9      | 59724/150370 [00:09<00:11, 8020.17it/s]","\rparsing log, completed traces ::  40%|####      | 60531/150370 [00:09<00:11, 7987.25it/s]","\rparsing log, completed traces ::  41%|####      | 61436/150370 [00:09<00:10, 8301.79it/s]","\rparsing log, completed traces ::  41%|####1     | 62328/150370 [00:09<00:10, 8484.93it/s]","\rparsing log, completed traces ::  42%|####2     | 63179/150370 [00:09<00:10, 8376.85it/s]","\rparsing log, completed traces ::  43%|####2     | 64019/150370 [00:09<00:10, 8269.09it/s]","\rparsing log, completed traces ::  43%|####3     | 64848/150370 [00:09<00:10, 8205.82it/s]","\rparsing log, completed traces ::  44%|####3     | 65671/150370 [00:09<00:10, 8211.83it/s]","\rparsing log, completed traces ::  44%|####4     | 66505/150370 [00:09<00:10, 8249.07it/s]","\rparsing log, completed traces ::  45%|####4     | 67331/150370 [00:10<00:26, 3180.21it/s]","\rparsing log, completed traces ::  45%|####5     | 68246/150370 [00:10<00:20, 4019.33it/s]","\rparsing log, completed traces ::  46%|####5     | 69104/150370 [00:10<00:16, 4781.92it/s]","\rparsing log, completed traces ::  46%|####6     | 69911/150370 [00:10<00:14, 5406.01it/s]","\rparsing log, completed traces ::  47%|####7     | 70735/150370 [00:11<00:13, 6014.30it/s]","\rparsing log, completed traces ::  48%|####7     | 71551/150370 [00:11<00:12, 6509.11it/s]","\rparsing log, completed traces ::  48%|####8     | 72361/150370 [00:11<00:11, 6907.65it/s]","\rparsing log, completed traces ::  49%|####8     | 73158/150370 [00:11<00:10, 7114.65it/s]","\rparsing log, completed traces ::  49%|####9     | 73946/150370 [00:11<00:10, 7221.08it/s]","\rparsing log, completed traces ::  50%|####9     | 74895/150370 [00:11<00:09, 7849.43it/s]","\rparsing log, completed traces ::  50%|#####     | 75723/150370 [00:11<00:09, 7923.86it/s]","\rparsing log, completed traces ::  51%|#####     | 76585/150370 [00:11<00:09, 8121.50it/s]","\rparsing log, completed traces ::  51%|#####1    | 77420/150370 [00:11<00:08, 8118.92it/s]","\rparsing log, completed traces ::  52%|#####2    | 78248/150370 [00:11<00:08, 8031.66it/s]","\rparsing log, completed traces ::  53%|#####2    | 79063/150370 [00:12<00:08, 8036.15it/s]","\rparsing log, completed traces ::  53%|#####3    | 79875/150370 [00:12<00:08, 7969.83it/s]","\rparsing log, completed traces ::  54%|#####3    | 80680/150370 [00:12<00:08, 7969.13it/s]","\rparsing log, completed traces ::  54%|#####4    | 81481/150370 [00:12<00:08, 7965.81it/s]","\rparsing log, completed traces ::  55%|#####4    | 82337/150370 [00:12<00:08, 8132.84it/s]","\rparsing log, completed traces ::  55%|#####5    | 83200/150370 [00:12<00:08, 8280.25it/s]","\rparsing log, completed traces ::  56%|#####5    | 84030/150370 [00:12<00:08, 8255.61it/s]","\rparsing log, completed traces ::  56%|#####6    | 84857/150370 [00:12<00:08, 8173.29it/s]","\rparsing log, completed traces ::  57%|#####6    | 85676/150370 [00:12<00:07, 8109.71it/s]","\rparsing log, completed traces ::  58%|#####7    | 86500/150370 [00:12<00:07, 8124.51it/s]","\rparsing log, completed traces ::  58%|#####8    | 87334/150370 [00:13<00:07, 8175.58it/s]","\rparsing log, completed traces ::  59%|#####8    | 88163/150370 [00:13<00:07, 8208.28it/s]","\rparsing log, completed traces ::  59%|#####9    | 88993/150370 [00:13<00:07, 8211.60it/s]","\rparsing log, completed traces ::  60%|#####9    | 89815/150370 [00:13<00:20, 2907.03it/s]","\rparsing log, completed traces ::  60%|######    | 90649/150370 [00:14<00:16, 3618.04it/s]","\rparsing log, completed traces ::  61%|######    | 91485/150370 [00:14<00:13, 4358.79it/s]","\rparsing log, completed traces ::  61%|######1   | 92319/150370 [00:14<00:11, 5081.60it/s]","\rparsing log, completed traces ::  62%|######1   | 93141/150370 [00:14<00:09, 5724.85it/s]","\rparsing log, completed traces ::  62%|######2   | 93976/150370 [00:14<00:08, 6315.39it/s]","\rparsing log, completed traces ::  63%|######3   | 94851/150370 [00:14<00:08, 6904.52it/s]","\rparsing log, completed traces ::  64%|######3   | 95702/150370 [00:14<00:07, 7320.32it/s]","\rparsing log, completed traces ::  64%|######4   | 96527/150370 [00:14<00:07, 7551.70it/s]","\rparsing log, completed traces ::  65%|######4   | 97350/150370 [00:14<00:06, 7735.88it/s]","\rparsing log, completed traces ::  65%|######5   | 98173/150370 [00:14<00:06, 7870.73it/s]","\rparsing log, completed traces ::  66%|######5   | 99005/150370 [00:15<00:06, 8000.27it/s]","\rparsing log, completed traces ::  66%|######6   | 99830/150370 [00:15<00:06, 8036.82it/s]","\rparsing log, completed traces ::  67%|######6   | 100654/150370 [00:15<00:06, 8094.42it/s]","\rparsing log, completed traces ::  67%|######7   | 101486/150370 [00:15<00:05, 8159.00it/s]","\rparsing log, completed traces ::  68%|######8   | 102321/150370 [00:15<00:05, 8215.44it/s]","\rparsing log, completed traces ::  69%|######8   | 103149/150370 [00:15<00:05, 8179.69it/s]","\rparsing log, completed traces ::  69%|######9   | 103972/150370 [00:15<00:05, 8145.77it/s]","\rparsing log, completed traces ::  70%|######9   | 104790/150370 [00:15<00:05, 8072.56it/s]","\rparsing log, completed traces ::  70%|#######   | 105600/150370 [00:15<00:05, 8042.89it/s]","\rparsing log, completed traces ::  71%|#######   | 106413/150370 [00:15<00:05, 8067.79it/s]","\rparsing log, completed traces ::  71%|#######1  | 107221/150370 [00:16<00:05, 7998.77it/s]","\rparsing log, completed traces ::  72%|#######1  | 108027/150370 [00:16<00:05, 8016.33it/s]","\rparsing log, completed traces ::  72%|#######2  | 108830/150370 [00:16<00:05, 7967.95it/s]","\rparsing log, completed traces ::  73%|#######2  | 109632/150370 [00:16<00:05, 7983.05it/s]","\rparsing log, completed traces ::  73%|#######3  | 110431/150370 [00:16<00:05, 7963.79it/s]","\rparsing log, completed traces ::  74%|#######3  | 111228/150370 [00:16<00:04, 7964.54it/s]","\rparsing log, completed traces ::  75%|#######4  | 112032/150370 [00:16<00:04, 7986.67it/s]","\rparsing log, completed traces ::  75%|#######5  | 112831/150370 [00:16<00:04, 7911.76it/s]","\rparsing log, completed traces ::  76%|#######5  | 113667/150370 [00:16<00:04, 8044.19it/s]","\rparsing log, completed traces ::  76%|#######6  | 114645/150370 [00:17<00:04, 8560.60it/s]","\rparsing log, completed traces ::  77%|#######6  | 115502/150370 [00:17<00:12, 2776.65it/s]","\rparsing log, completed traces ::  77%|#######7  | 116472/150370 [00:17<00:09, 3617.67it/s]","\rparsing log, completed traces ::  78%|#######8  | 117514/150370 [00:18<00:07, 4623.64it/s]","\rparsing log, completed traces ::  79%|#######8  | 118340/150370 [00:18<00:06, 5166.74it/s]","\rparsing log, completed traces ::  79%|#######9  | 119144/150370 [00:18<00:05, 5647.30it/s]","\rparsing log, completed traces ::  80%|#######9  | 119931/150370 [00:18<00:05, 6044.63it/s]","\rparsing log, completed traces ::  80%|########  | 120704/150370 [00:18<00:04, 6379.54it/s]","\rparsing log, completed traces ::  81%|########  | 121468/150370 [00:18<00:04, 6637.35it/s]","\rparsing log, completed traces ::  81%|########1 | 122226/150370 [00:18<00:04, 6882.39it/s]","\rparsing log, completed traces ::  82%|########1 | 122983/150370 [00:18<00:03, 7053.22it/s]","\rparsing log, completed traces ::  82%|########2 | 123738/150370 [00:18<00:03, 7170.58it/s]","\rparsing log, completed traces ::  83%|########2 | 124491/150370 [00:18<00:03, 7188.14it/s]","\rparsing log, completed traces ::  83%|########3 | 125235/150370 [00:19<00:03, 7257.98it/s]","\rparsing log, completed traces ::  84%|########3 | 125994/150370 [00:19<00:03, 7352.33it/s]","\rparsing log, completed traces ::  84%|########4 | 126761/150370 [00:19<00:03, 7445.36it/s]","\rparsing log, completed traces ::  85%|########4 | 127517/150370 [00:19<00:03, 7468.70it/s]","\rparsing log, completed traces ::  85%|########5 | 128284/150370 [00:19<00:02, 7527.41it/s]","\rparsing log, completed traces ::  86%|########5 | 129068/150370 [00:19<00:02, 7620.25it/s]","\rparsing log, completed traces ::  86%|########6 | 129848/150370 [00:19<00:02, 7672.53it/s]","\rparsing log, completed traces ::  87%|########6 | 130627/150370 [00:19<00:02, 7683.94it/s]","\rparsing log, completed traces ::  87%|########7 | 131404/150370 [00:19<00:02, 7702.31it/s]","\rparsing log, completed traces ::  88%|########7 | 132317/150370 [00:19<00:02, 8128.25it/s]","\rparsing log, completed traces ::  89%|########8 | 133172/150370 [00:20<00:02, 8253.23it/s]","\rparsing log, completed traces ::  89%|########9 | 133999/150370 [00:20<00:01, 8207.94it/s]","\rparsing log, completed traces ::  90%|########9 | 134821/150370 [00:20<00:01, 8070.92it/s]","\rparsing log, completed traces ::  90%|######### | 135629/150370 [00:20<00:01, 7972.84it/s]","\rparsing log, completed traces ::  91%|######### | 136428/150370 [00:20<00:01, 7848.00it/s]","\rparsing log, completed traces ::  91%|#########1| 137214/150370 [00:20<00:01, 7797.18it/s]","\rparsing log, completed traces ::  92%|#########1| 137995/150370 [00:20<00:01, 7714.13it/s]","\rparsing log, completed traces ::  92%|#########2| 138770/150370 [00:20<00:01, 7719.44it/s]","\rparsing log, completed traces ::  93%|#########2| 139546/150370 [00:20<00:01, 7719.89it/s]","\rparsing log, completed traces ::  93%|#########3| 140333/150370 [00:20<00:01, 7763.00it/s]","\rparsing log, completed traces ::  94%|#########3| 141133/150370 [00:21<00:01, 7832.42it/s]","\rparsing log, completed traces ::  94%|#########4| 141953/150370 [00:21<00:01, 7921.39it/s]","\rparsing log, completed traces ::  95%|#########4| 142746/150370 [00:21<00:00, 7859.84it/s]","\rparsing log, completed traces ::  95%|#########5| 143533/150370 [00:21<00:00, 7861.77it/s]","\rparsing log, completed traces ::  96%|#########5| 144320/150370 [00:22<00:02, 2310.13it/s]","\rparsing log, completed traces ::  96%|#########6| 145048/150370 [00:22<00:01, 2862.14it/s]","\rparsing log, completed traces ::  97%|#########6| 145696/150370 [00:22<00:01, 3356.72it/s]","\rparsing log, completed traces ::  97%|#########7| 146326/150370 [00:22<00:01, 3822.20it/s]","\rparsing log, completed traces ::  98%|#########7| 146953/150370 [00:22<00:00, 4275.30it/s]","\rparsing log, completed traces ::  98%|#########8| 147593/150370 [00:22<00:00, 4725.51it/s]","\rparsing log, completed traces ::  99%|#########8| 148228/150370 [00:22<00:00, 5096.31it/s]","\rparsing log, completed traces ::  99%|#########9| 148899/150370 [00:22<00:00, 5498.16it/s]","\rparsing log, completed traces ::  99%|#########9| 149575/150370 [00:23<00:00, 5828.73it/s]","\rparsing log, completed traces :: 100%|#########9| 150313/150370 [00:23<00:00, 6249.51it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:23<00:00, 6484.11it/s]","\n","[data] Loaded datasets: ['BPI2012', 'BPI2017', 'ROAD']","\n","\n=== Dataset: BPI2012 ===","\n","Samples train/val/test: 22252/4176/4196; vocab=23","\n","Epoch 1: validation_loss = 0.5594 | val_acc=0.7409 | val_f1=0.5316 | val_top3=0.9840","\n","Epoch 2: validation_loss = 0.5308 | val_acc=0.7598 | val_f1=0.5425 | val_top3=0.9854","\n","Epoch 3: validation_loss = 0.5333 | val_acc=0.7574 | val_f1=0.5725 | val_top3=0.9859","\n","Epoch 4: validation_loss = 0.5195 | val_acc=0.7629 | val_f1=0.5835 | val_top3=0.9861","\n","Epoch 5: validation_loss = 0.5221 | val_acc=0.7450 | val_f1=0.6007 | val_top3=0.9854","\n","Epoch 6: validation_loss = 0.5249 | val_acc=0.7634 | val_f1=0.5833 | val_top3=0.9861","\n","Epoch 7: validation_loss = 0.5073 | val_acc=0.7639 | val_f1=0.5909 | val_top3=0.9856","\n","Epoch 8: validation_loss = 0.5113 | val_acc=0.7593 | val_f1=0.5790 | val_top3=0.9859","\n","Epoch 9: validation_loss = 0.5105 | val_acc=0.7639 | val_f1=0.5842 | val_top3=0.9852","\n","Epoch 10: validation_loss = 0.5201 | val_acc=0.7634 | val_f1=0.5797 | val_top3=0.9847","\n","[BPI2012] Train: loss=0.5148 acc=0.7777 f1=0.5609 top3=0.9868","\n","[BPI2012] Test:  loss=0.5355 acc=0.7569 f1=0.5872 top3=0.9874","\n","\n=== Dataset: BPI2017 ===","\n","Samples train/val/test: 34519/7403/7374; vocab=24","\n","Epoch 1: validation_loss = 0.4172 | val_acc=0.8368 | val_f1=0.5299 | val_top3=0.9904","\n","Epoch 2: validation_loss = 0.4004 | val_acc=0.8367 | val_f1=0.5595 | val_top3=0.9907","\n","Epoch 3: validation_loss = 0.3864 | val_acc=0.8384 | val_f1=0.5719 | val_top3=0.9912","\n","Epoch 4: validation_loss = 0.3847 | val_acc=0.8395 | val_f1=0.5903 | val_top3=0.9919","\n","Epoch 5: validation_loss = 0.3812 | val_acc=0.8405 | val_f1=0.5856 | val_top3=0.9922","\n","Epoch 6: validation_loss = 0.3802 | val_acc=0.8376 | val_f1=0.5896 | val_top3=0.9916","\n","Epoch 7: validation_loss = 0.3769 | val_acc=0.8361 | val_f1=0.5957 | val_top3=0.9924","\n","Epoch 8: validation_loss = 0.3799 | val_acc=0.8386 | val_f1=0.6180 | val_top3=0.9927","\n","Epoch 9: validation_loss = 0.3805 | val_acc=0.8391 | val_f1=0.5989 | val_top3=0.9926","\n","Epoch 10: validation_loss = 0.3756 | val_acc=0.8399 | val_f1=0.6155 | val_top3=0.9928","\n","[BPI2017] Train: loss=0.3607 acc=0.8422 f1=0.5721 top3=0.9941","\n","[BPI2017] Test:  loss=0.3877 acc=0.8332 f1=0.5710 top3=0.9906","\n","\n=== Dataset: ROAD ===","\n","Samples train/val/test: 8707/1928/1869; vocab=11","\n","Epoch 1: validation_loss = 0.4913 | val_acc=0.7993 | val_f1=0.3684 | val_top3=0.9922","\n","Epoch 2: validation_loss = 0.4561 | val_acc=0.8086 | val_f1=0.4514 | val_top3=0.9948","\n","Epoch 3: validation_loss = 0.4566 | val_acc=0.8091 | val_f1=0.5300 | val_top3=0.9969","\n","Epoch 4: validation_loss = 0.4482 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 5: validation_loss = 0.4355 | val_acc=0.8112 | val_f1=0.6427 | val_top3=0.9969","\n","Epoch 6: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 7: validation_loss = 0.4328 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 8: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 9: validation_loss = 0.4274 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 10: validation_loss = 0.4329 | val_acc=0.8122 | val_f1=0.6664 | val_top3=0.9969","\n","[ROAD] Train: loss=0.4662 acc=0.7894 f1=0.5395 top3=0.9986","\n","[ROAD] Test:  loss=0.4833 acc=0.8020 f1=0.4740 top3=0.9936","\n","Execution time: 3 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the numpy file from the specified working directory, parse the nested experiment_data structure, and compute final or best metrics as requested. For training and test, I will report the final metrics saved in the structure. For validation, I will compute the best values across epochs for accuracy, F1 score, and top-3 accuracy, and the minimum validation loss using the recorded loss history. The script prints the dataset name followed by clearly labeled metrics and executes immediately.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef safe_get(d, *keys, default=None):\n    cur = d\n    for k in keys:\n        if isinstance(cur, dict) and k in cur:\n            cur = cur[k]\n        else:\n            return default\n    return cur\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.isfile(path):\n        raise FileNotFoundError(f\"File not found: {path}\")\n    data = np.load(path, allow_pickle=True).item()\n    if not isinstance(data, dict):\n        raise ValueError(\"Loaded experiment_data is not a dict.\")\n    return data\n\n\ndef extract_final_train_metrics(ds_data):\n    # Expect a 'final' entry\n    train_entries = safe_get(ds_data, \"metrics\", \"train\", default=[])\n    final = None\n    for tag, vals in train_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"train loss\"] = final.get(\"loss\", None)\n        out[\"train accuracy\"] = final.get(\"acc\", None)\n        out[\"train F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"train top-3 accuracy\"] = final.get(\"top3\", None)\n    else:\n        # Fallback: try last value from losses for loss only\n        train_losses = safe_get(ds_data, \"losses\", \"train\", default=[])\n        if train_losses:\n            out[\"train loss\"] = train_losses[-1][1]\n    return out\n\n\ndef extract_best_val_metrics(ds_data):\n    # Collect per-epoch validation metrics (acc, macro_f1, top3)\n    val_entries = safe_get(ds_data, \"metrics\", \"val\", default=[])\n    best = {\n        \"validation accuracy\": None,\n        \"validation F1 score\": None,\n        \"validation top-3 accuracy\": None,\n    }\n    for tag, vals in val_entries:\n        if isinstance(vals, dict):\n            acc = vals.get(\"acc\", None)\n            f1 = vals.get(\"macro_f1\", None)\n            top3 = vals.get(\"top3\", None)\n            if acc is not None:\n                best[\"validation accuracy\"] = (\n                    acc\n                    if best[\"validation accuracy\"] is None\n                    else max(best[\"validation accuracy\"], acc)\n                )\n            if f1 is not None:\n                best[\"validation F1 score\"] = (\n                    f1\n                    if best[\"validation F1 score\"] is None\n                    else max(best[\"validation F1 score\"], f1)\n                )\n            if top3 is not None:\n                best[\"validation top-3 accuracy\"] = (\n                    top3\n                    if best[\"validation top-3 accuracy\"] is None\n                    else max(best[\"validation top-3 accuracy\"], top3)\n                )\n    # For validation loss, use recorded losses per epoch and take the minimum\n    val_losses = safe_get(ds_data, \"losses\", \"val\", default=[])\n    if val_losses:\n        min_val_loss = min((v for (_, v) in val_losses), default=None)\n    else:\n        # fallback: check 'final' val entry if present\n        min_val_loss = None\n        for tag, vals in val_entries:\n            if tag == \"final\" and isinstance(vals, dict):\n                min_val_loss = vals.get(\"loss\", None)\n                break\n    out = {\"validation loss\": min_val_loss}\n    out.update(best)\n    return out\n\n\ndef extract_final_test_metrics(ds_data):\n    test_entries = safe_get(ds_data, \"metrics\", \"test\", default=[])\n    final = None\n    for tag, vals in test_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"test loss\"] = final.get(\"loss\", None)\n        out[\"test accuracy\"] = final.get(\"acc\", None)\n        out[\"test F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"test top-3 accuracy\"] = final.get(\"top3\", None)\n    return out\n\n\ndef format_print_metrics(dataset_name, metrics_dict):\n    print(dataset_name)\n    # Keep a consistent order for readability\n    ordered_keys = [\n        \"train loss\",\n        \"train accuracy\",\n        \"train F1 score\",\n        \"train top-3 accuracy\",\n        \"validation loss\",\n        \"validation accuracy\",\n        \"validation F1 score\",\n        \"validation top-3 accuracy\",\n        \"test loss\",\n        \"test accuracy\",\n        \"test F1 score\",\n        \"test top-3 accuracy\",\n    ]\n    printed_any = False\n    for k in ordered_keys:\n        if k in metrics_dict and metrics_dict[k] is not None:\n            val = metrics_dict[k]\n            if isinstance(val, float):\n                print(f\"{k}: {val:.4f}\")\n            else:\n                print(f\"{k}: {val}\")\n            printed_any = True\n    # Print any remaining keys that were not in the ordered list\n    for k, v in metrics_dict.items():\n        if k not in ordered_keys and v is not None:\n            if isinstance(v, float):\n                print(f\"{k}: {v:.4f}\")\n            else:\n                print(f\"{k}: {v}\")\n            printed_any = True\n    if not printed_any:\n        print(\"No metrics available\")\n\n\ndef run():\n    experiment_data = load_experiment_data()\n    for ds_name, ds_data in experiment_data.items():\n        all_metrics = {}\n        all_metrics.update(extract_final_train_metrics(ds_data))\n        all_metrics.update(extract_best_val_metrics(ds_data))\n        all_metrics.update(extract_final_test_metrics(ds_data))\n        format_print_metrics(ds_name, all_metrics)\n\n\n# Execute immediately\nrun()\n","parse_term_out":["BPI2012","\n","train loss: 0.5148","\n","train accuracy: 0.7777","\n","train F1 score: 0.5609","\n","train top-3 accuracy: 0.9868","\n","validation loss: 0.5073","\n","validation accuracy: 0.7639","\n","validation F1 score: 0.6007","\n","validation top-3 accuracy: 0.9861","\n","test loss: 0.5355","\n","test accuracy: 0.7569","\n","test F1 score: 0.5872","\n","test top-3 accuracy: 0.9874","\n","BPI2017","\n","train loss: 0.3607","\n","train accuracy: 0.8422","\n","train F1 score: 0.5721","\n","train top-3 accuracy: 0.9941","\n","validation loss: 0.3756","\n","validation accuracy: 0.8405","\n","validation F1 score: 0.6180","\n","validation top-3 accuracy: 0.9928","\n","test loss: 0.3877","\n","test accuracy: 0.8332","\n","test F1 score: 0.5710","\n","test top-3 accuracy: 0.9906","\n","ROAD","\n","train loss: 0.4662","\n","train accuracy: 0.7894","\n","train F1 score: 0.5395","\n","train top-3 accuracy: 0.9986","\n","validation loss: 0.4274","\n","validation accuracy: 0.8122","\n","validation F1 score: 0.6664","\n","validation top-3 accuracy: 0.9969","\n","test loss: 0.4833","\n","test accuracy: 0.8020","\n","test F1 score: 0.4740","\n","test top-3 accuracy: 0.9936","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":236.745676279068,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"","exp_results_dir":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839","metric":{"value":{"metric_names":[{"metric_name":"train loss","lower_is_better":true,"description":"Cross-entropy loss on the training split; lower indicates better fit.","data":[{"dataset_name":"BPI2012","final_value":0.5148,"best_value":0.5148},{"dataset_name":"BPI2017","final_value":0.3607,"best_value":0.3607},{"dataset_name":"ROAD","final_value":0.4662,"best_value":0.4662}]},{"metric_name":"train accuracy","lower_is_better":false,"description":"Classification accuracy on the training split; higher is better.","data":[{"dataset_name":"BPI2012","final_value":0.7777,"best_value":0.7777},{"dataset_name":"BPI2017","final_value":0.8422,"best_value":0.8422},{"dataset_name":"ROAD","final_value":0.7894,"best_value":0.7894}]},{"metric_name":"train F1 score","lower_is_better":false,"description":"F1 score on the training split; harmonic mean of precision and recall.","data":[{"dataset_name":"BPI2012","final_value":0.5609,"best_value":0.5609},{"dataset_name":"BPI2017","final_value":0.5721,"best_value":0.5721},{"dataset_name":"ROAD","final_value":0.5395,"best_value":0.5395}]},{"metric_name":"train top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the training split; prediction is correct if the true label is among the top 3 predictions.","data":[{"dataset_name":"BPI2012","final_value":0.9868,"best_value":0.9868},{"dataset_name":"BPI2017","final_value":0.9941,"best_value":0.9941},{"dataset_name":"ROAD","final_value":0.9986,"best_value":0.9986}]},{"metric_name":"validation loss","lower_is_better":true,"description":"Cross-entropy loss on the validation split; lower indicates better generalization.","data":[{"dataset_name":"BPI2012","final_value":0.5073,"best_value":0.5073},{"dataset_name":"BPI2017","final_value":0.3756,"best_value":0.3756},{"dataset_name":"ROAD","final_value":0.4274,"best_value":0.4274}]},{"metric_name":"validation accuracy","lower_is_better":false,"description":"Classification accuracy on the validation split; higher is better.","data":[{"dataset_name":"BPI2012","final_value":0.7639,"best_value":0.7639},{"dataset_name":"BPI2017","final_value":0.8405,"best_value":0.8405},{"dataset_name":"ROAD","final_value":0.8122,"best_value":0.8122}]},{"metric_name":"validation F1 score","lower_is_better":false,"description":"F1 score on the validation split; harmonic mean of precision and recall.","data":[{"dataset_name":"BPI2012","final_value":0.6007,"best_value":0.6007},{"dataset_name":"BPI2017","final_value":0.618,"best_value":0.618},{"dataset_name":"ROAD","final_value":0.6664,"best_value":0.6664}]},{"metric_name":"validation top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the validation split; prediction is correct if the true label is among the top 3 predictions.","data":[{"dataset_name":"BPI2012","final_value":0.9861,"best_value":0.9861},{"dataset_name":"BPI2017","final_value":0.9928,"best_value":0.9928},{"dataset_name":"ROAD","final_value":0.9969,"best_value":0.9969}]},{"metric_name":"test loss","lower_is_better":true,"description":"Cross-entropy loss on the test split; lower indicates better generalization.","data":[{"dataset_name":"BPI2012","final_value":0.5355,"best_value":0.5355},{"dataset_name":"BPI2017","final_value":0.3877,"best_value":0.3877},{"dataset_name":"ROAD","final_value":0.4833,"best_value":0.4833}]},{"metric_name":"test accuracy","lower_is_better":false,"description":"Classification accuracy on the test split; higher is better.","data":[{"dataset_name":"BPI2012","final_value":0.7569,"best_value":0.7569},{"dataset_name":"BPI2017","final_value":0.8332,"best_value":0.8332},{"dataset_name":"ROAD","final_value":0.802,"best_value":0.802}]},{"metric_name":"test F1 score","lower_is_better":false,"description":"F1 score on the test split; harmonic mean of precision and recall.","data":[{"dataset_name":"BPI2012","final_value":0.5872,"best_value":0.5872},{"dataset_name":"BPI2017","final_value":0.571,"best_value":0.571},{"dataset_name":"ROAD","final_value":0.474,"best_value":0.474}]},{"metric_name":"test top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the test split; prediction is correct if the true label is among the top 3 predictions.","data":[{"dataset_name":"BPI2012","final_value":0.9874,"best_value":0.9874},{"dataset_name":"BPI2017","final_value":0.9906,"best_value":0.9906},{"dataset_name":"ROAD","final_value":0.9936,"best_value":0.9936}]}]},"maximize":null,"name":null,"description":null},"is_buggy":false,"is_buggy_plots":false,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":["../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2017.png","../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2012.png","../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_ROAD.png","../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2017.png","../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_ROAD.png","../../logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2012.png"],"plot_paths":["experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2017.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2012.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_ROAD.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2017.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_ROAD.png","experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2012.png"],"plot_analyses":[{"analysis":"The validation Top-3 Accuracy for BPI2017 shows a consistent improvement over the epochs, indicating that the model is learning effectively and improving its prediction capability for the next activities in the process. This suggests that the tuned hyperparameters are effective for this dataset, as the accuracy continues to increase without signs of overfitting.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2017.png"},{"analysis":"For BPI2012, the validation Top-3 Accuracy initially increases rapidly but then shows fluctuations. The accuracy peaks around epoch 3-4, followed by a slight decrease. This could indicate that the model has reached its learning capacity for the given hyperparameters or that it may benefit from further tuning or regularization to stabilize the performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_BPI2012.png"},{"analysis":"The loss curves for ROAD demonstrate a significant drop in both training and validation loss within the initial epochs, stabilizing towards the end. This suggests that the model is converging well with minimal overfitting, as the training and validation losses are closely aligned. The rapid decrease in loss is promising for the model's predictive performance.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_ROAD.png"},{"analysis":"In BPI2017, the loss curves show a similar pattern to ROAD, with a sharp decline initially followed by stabilization. This indicates effective convergence and suggests that the hyperparameters are well-suited for this dataset, with the model learning efficiently without significant overfitting.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2017.png"},{"analysis":"Val Top-3 Accuracy for ROAD shows rapid improvement and stabilization, maintaining a high accuracy from epoch 3 onwards. This suggests that the model is very effective for this dataset, achieving strong predictive performance early in the training process. The stability of the accuracy indicates good hyperparameter tuning.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/val_top3_ROAD.png"},{"analysis":"The loss curves for BPI2012 exhibit a sharp decrease initially, with both training and validation loss aligning closely, which is indicative of good convergence. However, towards the end, there is a slight increase in validation loss, which may be a sign of slight overfitting. Additional regularization or further hyperparameter tuning could be explored to address this.","plot_path":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/loss_curves_BPI2012.png"}],"vlm_feedback_summary":"The results indicate that the model's hyperparameter tuning is generally effective across the different datasets, with strong predictive performance and convergence demonstrated. However, some datasets show signs of fluctuation or potential overfitting, suggesting room for further optimization or regularization. Overall, the experiments provide valuable insights into the model's capabilities and areas for improvement.","datasets_successfully_tested":["BPI2017","BPI2012","ROAD"],"ablation_name":null,"hyperparam_name":null,"is_seed_node":true,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"# Set random seed\nimport random\nimport numpy as np\nimport torch\n\nseed = 2\nrandom.seed(seed)\nnp.random.seed(seed)\ntorch.manual_seed(seed)\nif torch.cuda.is_available():\n    torch.cuda.manual_seed(seed)\n\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport numpy as np\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import f1_score, accuracy_score\nimport random\nimport math\nimport matplotlib.pyplot as plt\n\n# Device handling (required)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n# Experiment data structure\nexperiment_data = {\n    \"BPI2012\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"BPI2017\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n    \"ROAD\": {\n        \"metrics\": {\"train\": [], \"val\": [], \"test\": []},\n        \"losses\": {\"train\": [], \"val\": []},\n        \"predictions\": [],\n        \"ground_truth\": [],\n        \"epochs\": [],\n    },\n}\n\n# Data loading utilities (use provided helper)\nfrom ai_scientist.ideas.my_research_topic import load_datasets, pick_default_dataset\n\n\n# Reproducibility\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# Build prefixes\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    # Keep only 'complete' transitions if lifecycle exists\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        df = df[df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")]\n        if len(df) == 0:\n            df = df.copy()  # fallback if empty\n            df = df.sort_values([\"case_id\", \"timestamp\"])\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    # Build activity vocab\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}  # 0 for PAD\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        # Convert to numpy arrays for safe positional indexing\n        ts_ns = (\n            pd.to_datetime(g[\"timestamp\"], utc=True).astype(\"int64\").to_numpy()\n        )  # nanoseconds\n        ts = (ts_ns // 10**9).astype(np.int64)  # seconds as numpy array\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str).tolist()], dtype=np.int64\n        )\n        # simple calendar features\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        # time deltas and since start in seconds\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(\n            np.float32\n        )  # [T,5]\n        T = len(acts_ids)\n        if T < 2:\n            continue\n        # Generate prefixes of length k (min_prefix_len..min(max_prefix_len, T-1)); target = activity at position k\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            seq_acts = acts_ids[:k].tolist()\n            seq_feats = feats[:k]\n            target = int(acts_ids[k])\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": seq_acts,\n                    \"seq_feats\": seq_feats.copy(),\n                    \"target\": target,\n                    \"last_ts\": int(ts[k - 1]),\n                    \"next_ts\": int(ts[k]),\n                }\n            )\n\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n\n    # Collect feature normalization stats over all feats (initial; will be recomputed on train split)\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n    ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n    for s in samples:\n        if s[\"seq_feats\"].shape[0] > 0:\n            s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n            s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n    return samples, act2id, id2act, pad_id\n\n\n# Time-based split by case start time\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.zeros((pad_len, self.num_cont), dtype=np.float32)\n        feats_pad = np.vstack([feats_pad, feats.astype(np.float32)])\n        attn_mask = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad, dtype=torch.long),\n            \"feats\": torch.tensor(feats_pad, dtype=torch.float32),\n            \"mask\": torch.tensor(attn_mask, dtype=torch.float32),\n            \"y\": torch.tensor(s[\"target\"], dtype=torch.long),\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(\n        self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, num_layers=1, pad_idx=0\n    ):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim,\n            hidden_size=hidden,\n            batch_first=True,\n            num_layers=num_layers,\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)  # includes PAD index\n        self.pad_idx = pad_idx\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)  # [B,T,emb]\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h_last = h[-1]\n        h_last = self.dropout(h_last)\n        logits = self.fc(h_last)\n        return logits\n\n\ndef collate_fn(batch):\n    keys = batch[0].keys()\n    out = {k: torch.stack([b[k] for b in batch], dim=0) for k in keys}\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys, preds_top1, preds_probs = [], [], []\n    top3_correct = 0\n    n_total = 0\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk_idx = torch.topk(probs, k=k_val, dim=1)\n            ys.extend(batch[\"y\"].detach().cpu().tolist())\n            preds_top1.extend(top1.detach().cpu().tolist())\n            preds_probs.append(probs.detach().cpu().numpy())\n            # top-3 correctness\n            for i in range(batch[\"y\"].size(0)):\n                if batch[\"y\"][i].item() in topk_idx[i].detach().cpu().tolist():\n                    top3_correct += 1\n            n_total += batch[\"y\"].size(0)\n    avg_loss = total_loss / max(1, n_total)\n    y_true = np.array(ys)\n    y_pred = np.array(preds_top1)\n    mask = y_true != pad_idx\n    y_true = y_true[mask]\n    y_pred = y_pred[mask]\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except Exception:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n_total))\n    probs_concat = (\n        np.concatenate(preds_probs, axis=0)\n        if len(preds_probs) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return avg_loss, acc, f1, top3, y_true, y_pred, probs_concat\n\n\ndef train_one_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    # Time-based split\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    # Build samples across all to get vocab; we'll re-normalize with train stats\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    # Filter per split\n    samples_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    samples_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    samples_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # Recompute normalization using train samples only\n    if len(samples_train) > 0:\n        concat_feats = [\n            s[\"seq_feats\"] for s in samples_train if s[\"seq_feats\"].shape[0] > 0\n        ]\n        if len(concat_feats) > 0:\n            all_feats = np.concatenate(concat_feats, axis=0)\n            dt_mean, dt_std = all_feats[:, 0].mean(), all_feats[:, 0].std() + 1e-6\n            ss_mean, ss_std = all_feats[:, 1].mean(), all_feats[:, 1].std() + 1e-6\n\n            def norm_samples(samples):\n                for s in samples:\n                    if s[\"seq_feats\"].shape[0] > 0:\n                        s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                        s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n            norm_samples(samples_train)\n            norm_samples(samples_val)\n            norm_samples(samples_test)\n    print(\n        f\"Samples train/val/test: {len(samples_train)}/{len(samples_val)}/{len(samples_test)}; vocab={len(act2id)}\"\n    )\n    if len(samples_train) == 0 or len(act2id) < 2:\n        print(\"Not enough data to train. Skipping.\")\n        return\n    ds_train = PrefixDataset(\n        samples_train, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_val = PrefixDataset(\n        samples_val, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    ds_test = PrefixDataset(\n        samples_test, pad_id=pad_id, max_len=max_prefix_len, num_cont=5\n    )\n    dl_train = DataLoader(\n        ds_train,\n        batch_size=batch_size,\n        shuffle=True,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_val = DataLoader(\n        ds_val,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n    dl_test = DataLoader(\n        ds_test,\n        batch_size=batch_size,\n        shuffle=False,\n        collate_fn=collate_fn,\n        num_workers=0,\n    )\n\n    # Model\n    model = LSTMBaseline(\n        vocab_size=len(act2id),\n        emb_dim=64,\n        cont_dim=5,\n        hidden=128,\n        num_layers=1,\n        pad_idx=pad_id,\n    ).to(device)\n    criterion = nn.CrossEntropyLoss().to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Training loop\n    best_val_top3 = -1.0\n    best_state = None\n    hist = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for epoch in range(1, max_epochs + 1):\n        model.train()\n        total = 0\n        running_loss = 0.0\n        for batch in dl_train:\n            batch = {\n                k: v.to(device) for k, v in batch.items() if isinstance(v, torch.Tensor)\n            }\n            optimizer.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * logits.size(0)\n            total += logits.size(0)\n        train_loss = running_loss / max(1, total)\n        val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n            model, dl_val, criterion, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {epoch}: validation_loss = {val_loss:.4f} | val_acc={val_acc:.4f} | val_f1={val_f1:.4f} | val_top3={val_top3:.4f}\"\n        )\n        hist[\"train_loss\"].append(train_loss)\n        hist[\"val_loss\"].append(val_loss)\n        hist[\"val_top3\"].append(val_top3)\n        experiment_data[name][\"losses\"][\"train\"].append((epoch, train_loss))\n        experiment_data[name][\"losses\"][\"val\"].append((epoch, val_loss))\n        experiment_data[name][\"metrics\"][\"val\"].append(\n            (epoch, {\"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3})\n        )\n        experiment_data[name][\"epochs\"].append(epoch)\n        if val_top3 > best_val_top3:\n            best_val_top3 = val_top3\n            best_state = {k: v.cpu().clone() for k, v in model.state_dict().items()}\n\n    # Load best\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n\n    # Final eval on train/val/test\n    train_loss, train_acc, train_f1, train_top3, _, _, _ = evaluate(\n        model, dl_train, criterion, device, len(act2id), pad_id\n    )\n    val_loss, val_acc, val_f1, val_top3, _, _, _ = evaluate(\n        model, dl_val, criterion, device, len(act2id), pad_id\n    )\n    test_loss, test_acc, test_f1, test_top3, y_true_t, y_pred_t, probs_t = evaluate(\n        model, dl_test, criterion, device, len(act2id), pad_id\n    )\n    print(\n        f\"[{name}] Train: loss={train_loss:.4f} acc={train_acc:.4f} f1={train_f1:.4f} top3={train_top3:.4f}\"\n    )\n    print(\n        f\"[{name}] Test:  loss={test_loss:.4f} acc={test_acc:.4f} f1={test_f1:.4f} top3={test_top3:.4f}\"\n    )\n\n    # Save metrics\n    experiment_data[name][\"metrics\"][\"train\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": train_loss,\n                \"acc\": train_acc,\n                \"macro_f1\": train_f1,\n                \"top3\": train_top3,\n            },\n        )\n    )\n    experiment_data[name][\"metrics\"][\"val\"].append(\n        (\n            \"final\",\n            {\"loss\": val_loss, \"acc\": val_acc, \"macro_f1\": val_f1, \"top3\": val_top3},\n        )\n    )\n    experiment_data[name][\"metrics\"][\"test\"].append(\n        (\n            \"final\",\n            {\n                \"loss\": test_loss,\n                \"acc\": test_acc,\n                \"macro_f1\": test_f1,\n                \"top3\": test_top3,\n            },\n        )\n    )\n    experiment_data[name][\"predictions\"] = y_pred_t.tolist()\n    experiment_data[name][\"ground_truth\"] = y_true_t.tolist()\n\n    # Plots\n    try:\n        plt.figure()\n        plt.plot(hist[\"train_loss\"], label=\"train_loss\")\n        plt.plot(hist[\"val_loss\"], label=\"val_loss\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"loss_curves_{name}.png\"))\n        plt.close()\n\n        plt.figure()\n        plt.plot(hist[\"val_top3\"], label=\"val_top3\")\n        plt.legend()\n        plt.title(f\"Val Top-3 Acc - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Top-3 Acc\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"val_top3_{name}.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"[warn] Plotting failed: {e}\")\n\n    # Save confusion matrix-like data (optional)\n    try:\n        from sklearn.metrics import confusion_matrix\n\n        cm = confusion_matrix(y_true_t, y_pred_t)\n        np.save(os.path.join(working_dir, f\"cm_{name}.npy\"), cm)\n    except Exception as e:\n        print(f\"[warn] Confusion matrix failed: {e}\")\n\n\ndef main():\n    datasets = load_datasets()\n    # Loop through loaded datasets; cap to 5000 earliest cases for speed\n    for key, df in datasets.items():\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep_cases = set(starts.iloc[:5000][\"case_id\"])\n                df_small = df[df[\"case_id\"].isin(keep_cases)].copy()\n            else:\n                df_small = df\n        except Exception:\n            df_small = df\n        train_one_dataset(\n            key, df_small, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    np.savez_compressed(\n        os.path.join(working_dir, \"experiment_data_compressed.npz\"),\n        data=experiment_data,\n    )\n\n\n# Execute immediately\nmain()\n","plan":"Seed node","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nimport pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nfrom sklearn.metrics import (\n    f1_score,\n    accuracy_score,\n    confusion_matrix,\n    precision_recall_curve,\n    average_precision_score,\n)\nfrom sklearn.preprocessing import label_binarize\nimport random\nimport math\nfrom collections import defaultdict\n\n# Reproducibility and device\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\nprint(f\"Using device: {device}\")\n\n\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n\nset_seed(42)\n\n\n# --------- Data loading from local XES via pm4py ----------\ndef load_xes_folder(data_dir=\"data\"):\n    datasets = {}\n    try:\n        import pm4py\n    except Exception as e:\n        print(f\"pm4py not available: {e}\")\n        return datasets\n    if not os.path.isdir(data_dir):\n        print(f\"Data directory not found: {data_dir}\")\n        return datasets\n    for fn in os.listdir(data_dir):\n        if fn.lower().endswith(\".xes\") or fn.lower().endswith(\".xes.gz\"):\n            path = os.path.join(data_dir, fn)\n            try:\n                log = pm4py.read_xes(path)\n                df = pm4py.convert_to_dataframe(log)\n                # Standardize columns\n                # pm4py dataframe typically has case:concept:name, concept:name, time:timestamp, lifecycle:transition\n                cols = df.columns\n                case_col = (\n                    \"case:concept:name\"\n                    if \"case:concept:name\" in cols\n                    else (\"case\" if \"case\" in cols else None)\n                )\n                act_col = (\n                    \"concept:name\"\n                    if \"concept:name\" in cols\n                    else (\"activity\" if \"activity\" in cols else None)\n                )\n                ts_col = (\n                    \"time:timestamp\"\n                    if \"time:timestamp\" in cols\n                    else (\"timestamp\" if \"timestamp\" in cols else None)\n                )\n                life_col = (\n                    \"lifecycle:transition\"\n                    if \"lifecycle:transition\" in cols\n                    else (\"lifecycle\" if \"lifecycle\" in cols else None)\n                )\n                if case_col is None or act_col is None or ts_col is None:\n                    print(f\"Missing required columns in {fn}, skipping.\")\n                    continue\n                out = pd.DataFrame(\n                    {\n                        \"case_id\": df[case_col].astype(str).values,\n                        \"activity\": df[act_col].astype(str).values,\n                        \"timestamp\": pd.to_datetime(df[ts_col], utc=True),\n                    }\n                )\n                if life_col is not None:\n                    out[\"lifecycle\"] = df[life_col].astype(str).values\n                name = os.path.splitext(fn)[0]\n                datasets[name] = out\n                print(\n                    f\"Loaded {name}: {len(out)} events, {out['case_id'].nunique()} cases\"\n                )\n            except Exception as e:\n                print(f\"Failed to load {fn}: {e}\")\n    return datasets\n\n\n# --------- Prefix building and split ----------\ndef build_prefix_dataset(df, max_prefix_len=10, min_prefix_len=1):\n    df = df.copy()\n    if \"lifecycle\" in df.columns:\n        mask = df[\"lifecycle\"].astype(str).str.lower().eq(\"complete\")\n        if mask.any():\n            df = df[mask]\n    df = df.sort_values([\"case_id\", \"timestamp\"])\n    acts = df[\"activity\"].astype(str).unique().tolist()\n    act2id = {a: i + 1 for i, a in enumerate(sorted(acts))}\n    id2act = {i: a for a, i in act2id.items()}\n    pad_id = 0\n    samples = []\n    for cid, g in df.groupby(\"case_id\"):\n        g = g.sort_values(\"timestamp\")\n        if len(g) < 2:\n            continue\n        g_ts = pd.to_datetime(g[\"timestamp\"], utc=True)\n        ts = (g_ts.astype(\"int64\") // 10**9).to_numpy(np.int64)\n        acts_ids = np.array(\n            [act2id[a] for a in g[\"activity\"].astype(str)], dtype=np.int64\n        )\n        hours = (g_ts.dt.hour.to_numpy(dtype=float) / 23.0).astype(np.float32)\n        weekdays = (g_ts.dt.weekday.to_numpy(dtype=float) / 6.0).astype(np.float32)\n        working = (\n            (g_ts.dt.weekday.to_numpy() < 5)\n            & (g_ts.dt.hour.to_numpy() >= 8)\n            & (g_ts.dt.hour.to_numpy() <= 17)\n        ).astype(np.float32)\n        deltas = np.diff(ts, prepend=ts[0]).astype(np.float32)\n        since_start = (ts - ts[0]).astype(np.float32)\n        feats = np.stack(\n            [deltas, since_start, hours, weekdays, working], axis=1\n        ).astype(np.float32)\n        T = len(acts_ids)\n        max_k = min(max_prefix_len, T - 1)\n        for k in range(min_prefix_len, max_k + 1):\n            samples.append(\n                {\n                    \"case_id\": cid,\n                    \"seq_acts\": acts_ids[:k].tolist(),\n                    \"seq_feats\": feats[:k].copy(),\n                    \"target\": int(acts_ids[k]),\n                    \"prefix_len\": k,\n                }\n            )\n    if len(samples) == 0:\n        return samples, act2id, id2act, pad_id\n    all_feats = np.concatenate(\n        [s[\"seq_feats\"] for s in samples if len(s[\"seq_feats\"]) > 0], axis=0\n    )\n    for s in samples:\n        pass  # initial no norm; will norm on train split\n    return samples, act2id, id2act, pad_id\n\n\ndef time_based_split(df, train_frac=0.7, val_frac=0.15):\n    starts = (\n        df.sort_values(\"timestamp\").groupby(\"case_id\")[\"timestamp\"].min().reset_index()\n    )\n    starts = starts.sort_values(\"timestamp\").reset_index(drop=True)\n    n = len(starts)\n    n_train = int(n * train_frac)\n    n_val = int(n * val_frac)\n    train_cases = set(starts.iloc[:n_train][\"case_id\"])\n    val_cases = set(starts.iloc[n_train : n_train + n_val][\"case_id\"])\n    test_cases = set(starts.iloc[n_train + n_val :][\"case_id\"])\n    return train_cases, val_cases, test_cases\n\n\nclass PrefixDataset(Dataset):\n    def __init__(self, samples, pad_id, max_len=10, num_cont=5):\n        self.samples = samples\n        self.pad_id = pad_id\n        self.max_len = max_len\n        self.num_cont = num_cont\n\n    def __len__(self):\n        return len(self.samples)\n\n    def __getitem__(self, idx):\n        s = self.samples[idx]\n        seq = s[\"seq_acts\"][-self.max_len :]\n        feats = s[\"seq_feats\"][-self.max_len :]\n        L = len(seq)\n        pad_len = self.max_len - L\n        seq_pad = [self.pad_id] * pad_len + seq\n        feats_pad = np.vstack(\n            [\n                np.zeros((pad_len, self.num_cont), dtype=np.float32),\n                feats.astype(np.float32),\n            ]\n        )\n        attn = np.array([0] * pad_len + [1] * L, dtype=np.float32)\n        return {\n            \"acts\": torch.tensor(seq_pad).long(),\n            \"feats\": torch.tensor(feats_pad).float(),\n            \"mask\": torch.tensor(attn).float(),\n            \"y\": torch.tensor(s[\"target\"]).long(),\n            \"prefix_len\": L,\n        }\n\n\nclass LSTMBaseline(nn.Module):\n    def __init__(self, vocab_size, emb_dim=64, cont_dim=5, hidden=128, pad_idx=0):\n        super().__init__()\n        self.emb = nn.Embedding(vocab_size + 1, emb_dim, padding_idx=pad_idx)\n        self.lstm = nn.LSTM(\n            input_size=emb_dim + cont_dim, hidden_size=hidden, batch_first=True\n        )\n        self.dropout = nn.Dropout(0.2)\n        self.fc = nn.Linear(hidden, vocab_size + 1)\n\n    def forward(self, acts, feats, mask):\n        x = self.emb(acts)\n        x = torch.cat([x, feats], dim=-1)\n        out, (h, c) = self.lstm(x)\n        h = self.dropout(h[-1])\n        return self.fc(h)\n\n\ndef collate_fn(batch):\n    out = {\n        k: (\n            torch.stack([b[k] for b in batch], 0)\n            if isinstance(batch[0][k], torch.Tensor)\n            else [b[k] for b in batch]\n        )\n        for k in batch[0].keys()\n    }\n    return out\n\n\ndef evaluate(model, loader, criterion, device, num_classes, pad_idx):\n    model.eval()\n    total_loss = 0.0\n    ys = []\n    yhat = []\n    probs_list = []\n    n = 0\n    top3_correct = 0\n    pref_lens = []\n    top3_flags = []\n    with torch.no_grad():\n        for batch in loader:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = criterion(logits, batch[\"y\"])\n            total_loss += loss.item() * logits.size(0)\n            probs = torch.softmax(logits, dim=1)\n            top1 = torch.argmax(probs, dim=1)\n            k_val = min(3, probs.size(1))\n            _, topk = torch.topk(probs, k=k_val, dim=1)\n            y = batch[\"y\"]\n            ys.extend(y.detach().cpu().tolist())\n            yhat.extend(top1.detach().cpu().tolist())\n            probs_list.append(probs.detach().cpu().numpy())\n            for i in range(y.size(0)):\n                flag = int(y[i].item() in topk[i].detach().cpu().tolist())\n                top3_correct += flag\n                top3_flags.append(flag)\n                pref_lens.append(int(batch[\"prefix_len\"][i].item()))\n            n += y.size(0)\n    avg_loss = total_loss / max(1, n)\n    y_true = np.array(ys)\n    y_pred = np.array(yhat)\n    acc = float(accuracy_score(y_true, y_pred)) if len(y_true) > 0 else 0.0\n    try:\n        f1 = float(f1_score(y_true, y_pred, average=\"macro\"))\n    except:\n        f1 = 0.0\n    top3 = float(top3_correct / max(1, n))\n    probs_concat = (\n        np.concatenate(probs_list, axis=0)\n        if len(probs_list) > 0\n        else np.zeros((0, num_classes + 1))\n    )\n    return (\n        avg_loss,\n        acc,\n        f1,\n        top3,\n        y_true,\n        y_pred,\n        probs_concat,\n        np.array(pref_lens),\n        np.array(top3_flags),\n    )\n\n\ndef train_on_dataset(\n    name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n):\n    print(f\"\\n=== Dataset: {name} ===\")\n    train_cases, val_cases, test_cases = time_based_split(df, 0.7, 0.15)\n    samples_all, act2id, id2act, pad_id = build_prefix_dataset(\n        df, max_prefix_len=max_prefix_len\n    )\n    s_train = [s for s in samples_all if s[\"case_id\"] in train_cases]\n    s_val = [s for s in samples_all if s[\"case_id\"] in val_cases]\n    s_test = [s for s in samples_all if s[\"case_id\"] in test_cases]\n    # normalize time features on train\n    if len(s_train) > 0:\n        feats = np.concatenate(\n            [s[\"seq_feats\"] for s in s_train if len(s[\"seq_feats\"]) > 0], axis=0\n        )\n        dt_mean, dt_std = feats[:, 0].mean(), feats[:, 0].std() + 1e-6\n        ss_mean, ss_std = feats[:, 1].mean(), feats[:, 1].std() + 1e-6\n\n        def norm(samples):\n            for s in samples:\n                if s[\"seq_feats\"].shape[0] > 0:\n                    s[\"seq_feats\"][:, 0] = (s[\"seq_feats\"][:, 0] - dt_mean) / dt_std\n                    s[\"seq_feats\"][:, 1] = (s[\"seq_feats\"][:, 1] - ss_mean) / ss_std\n\n        norm(s_train)\n        norm(s_val)\n        norm(s_test)\n    print(\n        f\"Samples train/val/test: {len(s_train)}/{len(s_val)}/{len(s_test)}; vocab={len(act2id)}\"\n    )\n    if len(s_train) == 0 or len(act2id) < 2:\n        print(\"Insufficient data; skipping.\")\n        return None\n    ds_tr = PrefixDataset(s_train, pad_id, max_prefix_len, 5)\n    ds_va = PrefixDataset(s_val, pad_id, max_prefix_len, 5)\n    ds_te = PrefixDataset(s_test, pad_id, max_prefix_len, 5)\n    dl_tr = DataLoader(\n        ds_tr, batch_size=batch_size, shuffle=True, collate_fn=collate_fn\n    )\n    dl_va = DataLoader(\n        ds_va, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    dl_te = DataLoader(\n        ds_te, batch_size=batch_size, shuffle=False, collate_fn=collate_fn\n    )\n    model = LSTMBaseline(\n        vocab_size=len(act2id), emb_dim=64, cont_dim=5, hidden=128, pad_idx=pad_id\n    ).to(device)\n    crit = nn.CrossEntropyLoss().to(device)\n    opt = torch.optim.Adam(model.parameters(), lr=lr)\n    best_top3 = -1.0\n    best_state = None\n    history = {\"train_loss\": [], \"val_loss\": [], \"val_top3\": []}\n    for ep in range(1, max_epochs + 1):\n        model.train()\n        tot = 0\n        run_loss = 0.0\n        for batch in dl_tr:\n            batch = {\n                k: v.to(device) if isinstance(v, torch.Tensor) else v\n                for k, v in batch.items()\n            }\n            opt.zero_grad()\n            logits = model(batch[\"acts\"], batch[\"feats\"], batch[\"mask\"])\n            loss = crit(logits, batch[\"y\"])\n            loss.backward()\n            opt.step()\n            run_loss += loss.item() * logits.size(0)\n            tot += logits.size(0)\n        tr_loss = run_loss / max(1, tot)\n        va_loss, va_acc, va_f1, va_top3, *_ = evaluate(\n            model, dl_va, crit, device, len(act2id), pad_id\n        )\n        print(\n            f\"Epoch {ep}: val_loss={va_loss:.4f} acc={va_acc:.4f} f1={va_f1:.4f} top3={va_top3:.4f}\"\n        )\n        history[\"train_loss\"].append(tr_loss)\n        history[\"val_loss\"].append(va_loss)\n        history[\"val_top3\"].append(va_top3)\n        if va_top3 > best_top3:\n            best_top3 = va_top3\n            best_state = {\n                k: v.detach().cpu().clone() for k, v in model.state_dict().items()\n            }\n    if best_state is not None:\n        model.load_state_dict(best_state)\n        model.to(device)\n    tr_loss, tr_acc, tr_f1, tr_top3, *_ = evaluate(\n        model, dl_tr, crit, device, len(act2id), pad_id\n    )\n    te_loss, te_acc, te_f1, te_top3, y_true, y_pred, probs, pref_lens, top3_flags = (\n        evaluate(model, dl_te, crit, device, len(act2id), pad_id)\n    )\n    print(\n        f\"[{name}] Test: loss={te_loss:.4f} acc={te_acc:.4f} f1={te_f1:.4f} top3={te_top3:.4f}\"\n    )\n    # package experiment data\n    exp = {\n        \"metrics\": {\n            \"train\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": tr_loss,\n                        \"acc\": tr_acc,\n                        \"macro_f1\": tr_f1,\n                        \"top3\": tr_top3,\n                    },\n                )\n            ],\n            \"val\": [],\n            \"test\": [\n                (\n                    \"final\",\n                    {\n                        \"loss\": te_loss,\n                        \"acc\": te_acc,\n                        \"macro_f1\": te_f1,\n                        \"top3\": te_top3,\n                    },\n                )\n            ],\n        },\n        \"losses\": {\n            \"train\": list(enumerate(history[\"train_loss\"], start=1)),\n            \"val\": list(enumerate(history[\"val_loss\"], start=1)),\n        },\n        \"predictions\": y_pred.tolist(),\n        \"ground_truth\": y_true.tolist(),\n        \"epochs\": list(range(1, len(history[\"train_loss\"]) + 1)),\n        \"probs\": probs,\n        \"prefix_lens\": pref_lens.tolist(),\n        \"top3_flags\": top3_flags.tolist(),\n        \"act2id\": act2id,\n    }\n    # plots for this dataset\n    try:\n        plt.figure()\n        plt.plot(history[\"train_loss\"], label=\"train\")\n        plt.plot(history[\"val_loss\"], label=\"val\")\n        plt.legend()\n        plt.title(f\"Loss Curves - {name}\")\n        plt.xlabel(\"Epoch\")\n        plt.ylabel(\"Loss\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating loss curves for {name}: {e}\")\n        plt.close()\n    try:\n        cm = confusion_matrix(y_true, y_pred)\n        plt.figure(figsize=(5, 4))\n        plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n        plt.colorbar()\n        plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n        plt.xlabel(\"Predicted\")\n        plt.ylabel(\"True\")\n        plt.tight_layout()\n        plt.savefig(os.path.join(working_dir, f\"{name}_confusion_matrix.png\"))\n        plt.close()\n    except Exception as e:\n        print(f\"Error creating confusion matrix for {name}: {e}\")\n        plt.close()\n    try:\n        # Top-3 accuracy vs prefix length\n        if len(pref_lens) > 0:\n            d = defaultdict(list)\n            for L, flag in zip(pref_lens, top3_flags):\n                d[int(L)].append(int(flag))\n            xs = sorted(d.keys())\n            ys = [np.mean(d[k]) for k in xs]\n            plt.figure()\n            plt.plot(xs, ys, marker=\"o\")\n            plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n            plt.xlabel(\"Prefix Length\")\n            plt.ylabel(\"Top-3 Accuracy\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_top3_vs_prefixlen.png\"))\n            plt.close()\n    except Exception as e:\n        print(f\"Error creating Top-3 vs prefix length for {name}: {e}\")\n        plt.close()\n    try:\n        # Macro PR curve (one-vs-rest); may be coarse due to many classes\n        if probs.shape[0] > 0:\n            classes = np.unique(y_true)\n            Y = label_binarize(y_true, classes=range(probs.shape[1]))\n            # only keep columns present in classes to avoid PAD\n            present = [c for c in classes]\n            if len(present) > 1:\n                precisions = []\n                recalls = []\n                aps = []\n                for c in present:\n                    p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                    ap = average_precision_score(Y[:, c], probs[:, c])\n                    precisions.append(\n                        np.interp(np.linspace(0, 1, 101), r[::-1], p[::-1])\n                    )\n                    recalls.append(np.linspace(0, 1, 101))\n                    aps.append(ap)\n                macro_p = np.mean(np.stack(precisions, 0), 0)\n                macro_r = np.linspace(0, 1, 101)\n                plt.figure()\n                plt.plot(macro_r, macro_p, label=f\"Macro-PR (mAP={np.mean(aps):.3f})\")\n                plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Recall\")\n                plt.ylabel(\"Precision\")\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(os.path.join(working_dir, f\"{name}_macro_pr.png\"))\n                plt.close()\n    except Exception as e:\n        print(f\"Error creating PR curve for {name}: {e}\")\n        plt.close()\n    return name, exp\n\n\ndef main():\n    datasets = load_xes_folder(data_dir=os.path.join(os.getcwd(), \"data\"))\n    experiment_data = {}\n    for name, df in datasets.items():\n        # optional cap earliest 5000 cases\n        try:\n            starts = (\n                df.sort_values(\"timestamp\")\n                .groupby(\"case_id\")[\"timestamp\"]\n                .min()\n                .reset_index()\n            )\n            if len(starts) > 5000:\n                keep = set(starts.iloc[:5000][\"case_id\"])\n                df = df[df[\"case_id\"].isin(keep)].copy()\n        except:\n            pass\n        res = train_on_dataset(\n            name, df, max_epochs=10, batch_size=128, max_prefix_len=10, lr=1e-3\n        )\n        if res is not None:\n            k, exp = res\n            experiment_data[k] = exp\n    # Save experiment data\n    np.save(os.path.join(working_dir, \"experiment_data.npy\"), experiment_data)\n    # Print evaluation metrics\n    for k, v in experiment_data.items():\n        test_metrics = dict(v[\"metrics\"][\"test\"][0][1])\n        print(\n            f\"{k} | Test acc={test_metrics['acc']:.4f} macro_f1={test_metrics['macro_f1']:.4f} top3={test_metrics['top3']:.4f} loss={test_metrics['loss']:.4f}\"\n        )\n\n    # Secondary plotting pass strictly from experiment_data.npy (as required)\n    try:\n        experiment_data_loaded = np.load(\n            os.path.join(working_dir, \"experiment_data.npy\"), allow_pickle=True\n        ).item()\n    except Exception as e:\n        print(f\"Error loading experiment data: {e}\")\n        experiment_data_loaded = {}\n    for name, ed in experiment_data_loaded.items():\n        try:\n            # re-plot loss curves from saved data\n            plt.figure()\n            tl = [y for (_, y) in ed.get(\"losses\", {}).get(\"train\", [])]\n            vl = [y for (_, y) in ed.get(\"losses\", {}).get(\"val\", [])]\n            if len(tl) > 0:\n                plt.plot(tl, label=\"train\")\n            if len(vl) > 0:\n                plt.plot(vl, label=\"val\")\n            plt.legend()\n            plt.title(f\"Loss Curves - {name}\\nNext-activity\")\n            plt.xlabel(\"Epoch\")\n            plt.ylabel(\"Loss\")\n            plt.tight_layout()\n            plt.savefig(os.path.join(working_dir, f\"{name}_loss_curves_reload.png\"))\n            plt.close()\n        except Exception as e:\n            print(f\"Error creating plot1: {e}\")\n            plt.close()\n        try:\n            # confusion matrix from predictions and ground truth\n            y_true = ed.get(\"ground_truth\", [])\n            y_pred = ed.get(\"predictions\", [])\n            if len(y_true) > 0 and len(y_pred) > 0:\n                cm = confusion_matrix(y_true, y_pred)\n                plt.figure(figsize=(5, 4))\n                plt.imshow(cm, aspect=\"auto\", cmap=\"Blues\")\n                plt.colorbar()\n                plt.title(f\"Confusion Matrix (Test) - {name}\\nNext-activity\")\n                plt.xlabel(\"Predicted\")\n                plt.ylabel(\"True\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_confusion_matrix_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot2: {e}\")\n            plt.close()\n        try:\n            # Top-3 vs prefix length if present\n            pref = ed.get(\"prefix_lens\", [])\n            flags = ed.get(\"top3_flags\", [])\n            if len(pref) > 0 and len(flags) > 0:\n                d = defaultdict(list)\n                for L, f in zip(pref, flags):\n                    d[int(L)].append(int(f))\n                xs = sorted(d.keys())\n                ys = [float(np.mean(d[x])) for x in xs]\n                plt.figure()\n                plt.plot(xs, ys, marker=\"o\")\n                plt.title(f\"Top-3 Accuracy vs Prefix Length - {name}\\nNext-activity\")\n                plt.xlabel(\"Prefix Length\")\n                plt.ylabel(\"Top-3 Accuracy\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{name}_top3_vs_prefixlen_reload.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating plot3: {e}\")\n            plt.close()\n        try:\n            # Macro PR curve if probs available\n            probs = np.array(ed.get(\"probs\", []))\n            y_true = ed.get(\"ground_truth\", [])\n            if probs.size > 0 and len(y_true) > 0:\n                classes = sorted(set(y_true))\n                Y = label_binarize(np.array(y_true), classes=range(probs.shape[1]))\n                present = classes\n                if len(present) > 1:\n                    precisions = []\n                    aps = []\n                    grid = np.linspace(0, 1, 101)\n                    for c in present:\n                        p, r, _ = precision_recall_curve(Y[:, c], probs[:, c])\n                        precisions.append(np.interp(grid, r[::-1], p[::-1]))\n                        aps.append(average_precision_score(Y[:, c], probs[:, c]))\n                    macro_p = np.mean(np.stack(precisions, 0), 0)\n                    plt.figure()\n                    plt.plot(grid, macro_p, label=f\"mAP={np.mean(aps):.3f}\")\n                    plt.title(f\"Macro Precision-Recall (Test) - {name}\\nNext-activity\")\n                    plt.xlabel(\"Recall\")\n                    plt.ylabel(\"Precision\")\n                    plt.legend()\n                    plt.tight_layout()\n                    plt.savefig(\n                        os.path.join(working_dir, f\"{name}_macro_pr_reload.png\")\n                    )\n                    plt.close()\n        except Exception as e:\n            print(f\"Error creating plot4: {e}\")\n            plt.close()\n\n\nif __name__ == \"__main__\":\n    main()\n","plot_plan":null,"step":12,"id":"852328dac5e14beb9bfce93a32da5a6a","ctime":1757762453.9858685,"_term_out":["Using device: cuda","\n","[data] Using discovered data dir: /workspace/data","\n","[data] Available in /workspace/data: ['BPI_Challenge_2012.xes', 'BPI_Challenge_2017.xes', 'Road_Traffic_Fine_Management_Process.xes']","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2012.xes","\n","\rparsing log, completed traces ::   0%|          | 0/13087 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/13087 [00:00<21:53,  9.96it/s]","\rparsing log, completed traces ::   1%|1         | 154/13087 [00:00<00:14, 902.53it/s]","\rparsing log, completed traces ::   2%|2         | 269/13087 [00:00<00:37, 344.14it/s]","\rparsing log, completed traces ::   3%|3         | 426/13087 [00:00<00:22, 565.77it/s]","\rparsing log, completed traces ::   5%|4         | 599/13087 [00:00<00:15, 801.74it/s]","\rparsing log, completed traces ::   6%|6         | 789/13087 [00:01<00:11, 1050.02it/s]","\rparsing log, completed traces ::   7%|7         | 951/13087 [00:01<00:10, 1188.96it/s]","\rparsing log, completed traces ::   9%|8         | 1114/13087 [00:01<00:09, 1301.43it/s]","\rparsing log, completed traces ::  10%|9         | 1284/13087 [00:01<00:08, 1408.79it/s]","\rparsing log, completed traces ::  11%|#1        | 1487/13087 [00:01<00:07, 1579.97it/s]","\rparsing log, completed traces ::  13%|#2        | 1668/13087 [00:01<00:06, 1641.38it/s]","\rparsing log, completed traces ::  14%|#4        | 1843/13087 [00:01<00:06, 1669.42it/s]","\rparsing log, completed traces ::  15%|#5        | 2018/13087 [00:01<00:06, 1666.39it/s]","\rparsing log, completed traces ::  17%|#6        | 2190/13087 [00:01<00:06, 1672.91it/s]","\rparsing log, completed traces ::  18%|#8        | 2374/13087 [00:01<00:06, 1720.67it/s]","\rparsing log, completed traces ::  20%|#9        | 2552/13087 [00:02<00:06, 1737.81it/s]","\rparsing log, completed traces ::  21%|##        | 2728/13087 [00:02<00:05, 1731.46it/s]","\rparsing log, completed traces ::  22%|##2       | 2903/13087 [00:02<00:06, 1677.68it/s]","\rparsing log, completed traces ::  23%|##3       | 3073/13087 [00:02<00:06, 1642.98it/s]","\rparsing log, completed traces ::  25%|##4       | 3265/13087 [00:02<00:05, 1722.37it/s]","\rparsing log, completed traces ::  26%|##6       | 3439/13087 [00:02<00:11, 832.77it/s] ","\rparsing log, completed traces ::  28%|##7       | 3630/13087 [00:03<00:09, 1012.68it/s]","\rparsing log, completed traces ::  29%|##9       | 3806/13087 [00:03<00:08, 1155.37it/s]","\rparsing log, completed traces ::  31%|###       | 4002/13087 [00:03<00:06, 1326.79it/s]","\rparsing log, completed traces ::  33%|###2      | 4278/13087 [00:03<00:05, 1660.09it/s]","\rparsing log, completed traces ::  34%|###4      | 4482/13087 [00:03<00:04, 1755.45it/s]","\rparsing log, completed traces ::  36%|###5      | 4696/13087 [00:03<00:04, 1855.32it/s]","\rparsing log, completed traces ::  37%|###7      | 4901/13087 [00:03<00:04, 1855.45it/s]","\rparsing log, completed traces ::  39%|###8      | 5101/13087 [00:03<00:04, 1852.06it/s]","\rparsing log, completed traces ::  40%|####      | 5296/13087 [00:03<00:04, 1838.79it/s]","\rparsing log, completed traces ::  42%|####1     | 5487/13087 [00:03<00:04, 1761.00it/s]","\rparsing log, completed traces ::  43%|####3     | 5669/13087 [00:04<00:04, 1744.64it/s]","\rparsing log, completed traces ::  45%|####4     | 5847/13087 [00:04<00:04, 1737.24it/s]","\rparsing log, completed traces ::  46%|####6     | 6039/13087 [00:04<00:03, 1788.52it/s]","\rparsing log, completed traces ::  48%|####7     | 6220/13087 [00:04<00:03, 1753.15it/s]","\rparsing log, completed traces ::  49%|####9     | 6430/13087 [00:04<00:03, 1851.91it/s]","\rparsing log, completed traces ::  51%|#####     | 6617/13087 [00:04<00:03, 1768.15it/s]","\rparsing log, completed traces ::  52%|#####1    | 6796/13087 [00:04<00:03, 1746.48it/s]","\rparsing log, completed traces ::  53%|#####3    | 6972/13087 [00:04<00:03, 1670.77it/s]","\rparsing log, completed traces ::  55%|#####4    | 7151/13087 [00:04<00:03, 1698.30it/s]","\rparsing log, completed traces ::  56%|#####5    | 7322/13087 [00:05<00:07, 742.98it/s] ","\rparsing log, completed traces ::  57%|#####7    | 7468/13087 [00:05<00:06, 850.82it/s]","\rparsing log, completed traces ::  58%|#####8    | 7628/13087 [00:05<00:05, 981.02it/s]","\rparsing log, completed traces ::  60%|#####9    | 7798/13087 [00:05<00:04, 1123.74it/s]","\rparsing log, completed traces ::  61%|######    | 7948/13087 [00:05<00:04, 1195.85it/s]","\rparsing log, completed traces ::  62%|######2   | 8118/13087 [00:06<00:03, 1316.06it/s]","\rparsing log, completed traces ::  63%|######3   | 8296/13087 [00:06<00:03, 1430.02it/s]","\rparsing log, completed traces ::  65%|######4   | 8465/13087 [00:06<00:03, 1496.67it/s]","\rparsing log, completed traces ::  66%|######6   | 8638/13087 [00:06<00:02, 1557.24it/s]","\rparsing log, completed traces ::  67%|######7   | 8808/13087 [00:06<00:02, 1591.04it/s]","\rparsing log, completed traces ::  69%|######8   | 8975/13087 [00:06<00:02, 1606.38it/s]","\rparsing log, completed traces ::  70%|######9   | 9141/13087 [00:06<00:02, 1568.21it/s]","\rparsing log, completed traces ::  71%|#######1  | 9331/13087 [00:06<00:02, 1660.56it/s]","\rparsing log, completed traces ::  73%|#######2  | 9501/13087 [00:06<00:02, 1628.30it/s]","\rparsing log, completed traces ::  74%|#######3  | 9666/13087 [00:06<00:02, 1587.54it/s]","\rparsing log, completed traces ::  75%|#######5  | 9841/13087 [00:07<00:01, 1629.85it/s]","\rparsing log, completed traces ::  76%|#######6  | 10006/13087 [00:07<00:01, 1593.61it/s]","\rparsing log, completed traces ::  78%|#######7  | 10169/13087 [00:07<00:01, 1599.75it/s]","\rparsing log, completed traces ::  79%|#######8  | 10330/13087 [00:07<00:01, 1567.74it/s]","\rparsing log, completed traces ::  80%|########  | 10488/13087 [00:07<00:01, 1566.41it/s]","\rparsing log, completed traces ::  81%|########1 | 10655/13087 [00:07<00:01, 1595.38it/s]","\rparsing log, completed traces ::  83%|########2 | 10832/13087 [00:07<00:01, 1644.68it/s]","\rparsing log, completed traces ::  84%|########4 | 11024/13087 [00:07<00:01, 1724.69it/s]","\rparsing log, completed traces ::  86%|########5 | 11198/13087 [00:07<00:01, 1729.21it/s]","\rparsing log, completed traces ::  87%|########7 | 11389/13087 [00:07<00:00, 1782.62it/s]","\rparsing log, completed traces ::  88%|########8 | 11568/13087 [00:08<00:02, 747.46it/s] ","\rparsing log, completed traces ::  90%|########9 | 11764/13087 [00:08<00:01, 930.20it/s]","\rparsing log, completed traces ::  92%|#########1| 11978/13087 [00:08<00:00, 1144.23it/s]","\rparsing log, completed traces ::  93%|#########2| 12167/13087 [00:08<00:00, 1295.06it/s]","\rparsing log, completed traces ::  95%|#########4| 12380/13087 [00:08<00:00, 1481.48it/s]","\rparsing log, completed traces ::  96%|#########6| 12583/13087 [00:09<00:00, 1614.12it/s]","\rparsing log, completed traces ::  98%|#########7| 12776/13087 [00:09<00:00, 1694.12it/s]","\rparsing log, completed traces ::  99%|#########9| 12975/13087 [00:09<00:00, 1769.43it/s]","","\rparsing log, completed traces :: 100%|##########| 13087/13087 [00:09<00:00, 1411.03it/s]","\n","[data] Loading XES: /workspace/data/BPI_Challenge_2017.xes","\n","\rparsing log, completed traces ::   0%|          | 0/31509 [00:00<?, ?it/s]","\rparsing log, completed traces ::   0%|          | 1/31509 [00:00<4:35:20,  1.91it/s]","\rparsing log, completed traces ::   0%|          | 68/31509 [00:00<03:37, 144.58it/s]","\rparsing log, completed traces ::   0%|          | 127/31509 [00:00<02:06, 248.30it/s]","\rparsing log, completed traces ::   1%|          | 195/31509 [00:00<01:28, 355.58it/s]","\rparsing log, completed traces ::   1%|          | 257/31509 [00:00<01:13, 424.37it/s]","\rparsing log, completed traces ::   1%|1         | 323/31509 [00:01<01:04, 486.51it/s]","\rparsing log, completed traces ::   1%|1         | 388/31509 [00:01<00:58, 530.42it/s]","\rparsing log, completed traces ::   1%|1         | 450/31509 [00:01<00:56, 550.78it/s]","\rparsing log, completed traces ::   2%|1         | 516/31509 [00:01<00:53, 579.78it/s]","\rparsing log, completed traces ::   2%|1         | 579/31509 [00:01<00:53, 583.43it/s]","\rparsing log, completed traces ::   2%|2         | 649/31509 [00:01<00:50, 614.24it/s]","\rparsing log, completed traces ::   2%|2         | 720/31509 [00:01<00:48, 640.01it/s]","\rparsing log, completed traces ::   2%|2         | 786/31509 [00:01<00:48, 632.98it/s]","\rparsing log, completed traces ::   3%|2         | 851/31509 [00:01<00:48, 634.54it/s]","\rparsing log, completed traces ::   3%|2         | 917/31509 [00:01<00:47, 638.80it/s]","\rparsing log, completed traces ::   3%|3         | 990/31509 [00:02<00:45, 664.56it/s]","\rparsing log, completed traces ::   3%|3         | 1057/31509 [00:02<00:47, 647.84it/s]","\rparsing log, completed traces ::   4%|3         | 1125/31509 [00:02<00:46, 654.29it/s]","\rparsing log, completed traces ::   4%|3         | 1195/31509 [00:02<00:45, 666.62it/s]","\rparsing log, completed traces ::   4%|4         | 1267/31509 [00:02<00:44, 681.62it/s]","\rparsing log, completed traces ::   4%|4         | 1336/31509 [00:02<00:45, 666.36it/s]","\rparsing log, completed traces ::   4%|4         | 1403/31509 [00:02<00:45, 662.35it/s]","\rparsing log, completed traces ::   5%|4         | 1470/31509 [00:03<01:41, 296.82it/s]","\rparsing log, completed traces ::   5%|4         | 1536/31509 [00:03<01:24, 353.33it/s]","\rparsing log, completed traces ::   5%|5         | 1602/31509 [00:03<01:13, 408.85it/s]","\rparsing log, completed traces ::   5%|5         | 1664/31509 [00:03<01:05, 452.20it/s]","\rparsing log, completed traces ::   5%|5         | 1732/31509 [00:03<00:59, 503.26it/s]","\rparsing log, completed traces ::   6%|5         | 1794/31509 [00:03<00:56, 523.59it/s]","\rparsing log, completed traces ::   6%|5         | 1855/31509 [00:03<00:55, 538.87it/s]","\rparsing log, completed traces ::   6%|6         | 1920/31509 [00:03<00:52, 566.73it/s]","\rparsing log, completed traces ::   6%|6         | 1986/31509 [00:04<00:49, 591.52it/s]","\rparsing log, completed traces ::   7%|6         | 2050/31509 [00:04<00:48, 604.04it/s]","\rparsing log, completed traces ::   7%|6         | 2118/31509 [00:04<00:47, 622.30it/s]","\rparsing log, completed traces ::   7%|6         | 2186/31509 [00:04<00:45, 638.12it/s]","\rparsing log, completed traces ::   7%|7         | 2254/31509 [00:04<00:45, 648.54it/s]","\rparsing log, completed traces ::   7%|7         | 2322/31509 [00:04<00:44, 655.92it/s]","\rparsing log, completed traces ::   8%|7         | 2389/31509 [00:04<00:44, 652.21it/s]","\rparsing log, completed traces ::   8%|7         | 2458/31509 [00:04<00:43, 662.25it/s]","\rparsing log, completed traces ::   8%|8         | 2525/31509 [00:04<00:43, 659.26it/s]","\rparsing log, completed traces ::   8%|8         | 2601/31509 [00:04<00:42, 686.24it/s]","\rparsing log, completed traces ::   8%|8         | 2670/31509 [00:05<00:42, 684.03it/s]","\rparsing log, completed traces ::   9%|8         | 2739/31509 [00:05<00:42, 672.08it/s]","\rparsing log, completed traces ::   9%|8         | 2811/31509 [00:05<00:41, 684.29it/s]","\rparsing log, completed traces ::   9%|9         | 2887/31509 [00:05<00:40, 705.46it/s]","\rparsing log, completed traces ::   9%|9         | 2958/31509 [00:05<01:28, 323.49it/s]","\rparsing log, completed traces ::  10%|9         | 3028/31509 [00:05<01:14, 384.25it/s]","\rparsing log, completed traces ::  10%|9         | 3095/31509 [00:06<01:05, 436.70it/s]","\rparsing log, completed traces ::  10%|#         | 3160/31509 [00:06<00:58, 481.33it/s]","\rparsing log, completed traces ::  10%|#         | 3222/31509 [00:06<00:55, 510.90it/s]","\rparsing log, completed traces ::  10%|#         | 3298/31509 [00:06<00:49, 571.78it/s]","\rparsing log, completed traces ::  11%|#         | 3371/31509 [00:06<00:45, 612.62it/s]","\rparsing log, completed traces ::  11%|#         | 3449/31509 [00:06<00:42, 656.64it/s]","\rparsing log, completed traces ::  11%|#1        | 3524/31509 [00:06<00:41, 679.43it/s]","\rparsing log, completed traces ::  11%|#1        | 3596/31509 [00:06<00:41, 676.23it/s]","\rparsing log, completed traces ::  12%|#1        | 3669/31509 [00:06<00:40, 688.79it/s]","\rparsing log, completed traces ::  12%|#1        | 3742/31509 [00:06<00:39, 697.33it/s]","\rparsing log, completed traces ::  12%|#2        | 3814/31509 [00:07<00:40, 687.41it/s]","\rparsing log, completed traces ::  12%|#2        | 3884/31509 [00:07<00:40, 688.90it/s]","\rparsing log, completed traces ::  13%|#2        | 3955/31509 [00:07<00:39, 694.71it/s]","\rparsing log, completed traces ::  13%|#2        | 4028/31509 [00:07<00:39, 700.61it/s]","\rparsing log, completed traces ::  13%|#3        | 4100/31509 [00:07<00:38, 706.00it/s]","\rparsing log, completed traces ::  13%|#3        | 4171/31509 [00:07<00:39, 696.02it/s]","\rparsing log, completed traces ::  13%|#3        | 4241/31509 [00:07<00:39, 684.76it/s]","\rparsing log, completed traces ::  14%|#3        | 4310/31509 [00:07<00:40, 672.61it/s]","\rparsing log, completed traces ::  14%|#3        | 4380/31509 [00:07<00:39, 679.63it/s]","\rparsing log, completed traces ::  14%|#4        | 4449/31509 [00:07<00:40, 673.68it/s]","\rparsing log, completed traces ::  14%|#4        | 4519/31509 [00:08<00:39, 679.94it/s]","\rparsing log, completed traces ::  15%|#4        | 4589/31509 [00:08<00:39, 682.96it/s]","\rparsing log, completed traces ::  15%|#4        | 4663/31509 [00:08<00:38, 696.66it/s]","\rparsing log, completed traces ::  15%|#5        | 4733/31509 [00:08<01:31, 291.45it/s]","\rparsing log, completed traces ::  15%|#5        | 4800/31509 [00:08<01:16, 347.27it/s]","\rparsing log, completed traces ::  15%|#5        | 4873/31509 [00:09<01:04, 413.94it/s]","\rparsing log, completed traces ::  16%|#5        | 4942/31509 [00:09<00:56, 468.28it/s]","\rparsing log, completed traces ::  16%|#5        | 5012/31509 [00:09<00:51, 518.97it/s]","\rparsing log, completed traces ::  16%|#6        | 5088/31509 [00:09<00:45, 576.05it/s]","\rparsing log, completed traces ::  16%|#6        | 5158/31509 [00:09<00:43, 603.70it/s]","\rparsing log, completed traces ::  17%|#6        | 5230/31509 [00:09<00:41, 633.63it/s]","\rparsing log, completed traces ::  17%|#6        | 5302/31509 [00:09<00:40, 652.96it/s]","\rparsing log, completed traces ::  17%|#7        | 5372/31509 [00:09<00:39, 662.73it/s]","\rparsing log, completed traces ::  17%|#7        | 5442/31509 [00:09<00:38, 668.50it/s]","\rparsing log, completed traces ::  18%|#7        | 5517/31509 [00:09<00:37, 690.84it/s]","\rparsing log, completed traces ::  18%|#7        | 5591/31509 [00:10<00:36, 701.72it/s]","\rparsing log, completed traces ::  18%|#7        | 5666/31509 [00:10<00:36, 715.33it/s]","\rparsing log, completed traces ::  18%|#8        | 5747/31509 [00:10<00:34, 740.42it/s]","\rparsing log, completed traces ::  18%|#8        | 5822/31509 [00:10<00:35, 728.79it/s]","\rparsing log, completed traces ::  19%|#8        | 5898/31509 [00:10<00:34, 737.12it/s]","\rparsing log, completed traces ::  19%|#8        | 5976/31509 [00:10<00:34, 748.31it/s]","\rparsing log, completed traces ::  19%|#9        | 6052/31509 [00:10<00:35, 723.15it/s]","\rparsing log, completed traces ::  19%|#9        | 6125/31509 [00:10<00:36, 702.70it/s]","\rparsing log, completed traces ::  20%|#9        | 6197/31509 [00:10<00:35, 705.41it/s]","\rparsing log, completed traces ::  20%|#9        | 6270/31509 [00:11<00:35, 709.39it/s]","\rparsing log, completed traces ::  20%|##        | 6342/31509 [00:11<00:35, 699.92it/s]","\rparsing log, completed traces ::  20%|##        | 6416/31509 [00:11<00:35, 710.66it/s]","\rparsing log, completed traces ::  21%|##        | 6488/31509 [00:11<00:35, 701.62it/s]","\rparsing log, completed traces ::  21%|##        | 6559/31509 [00:11<00:37, 669.26it/s]","\rparsing log, completed traces ::  21%|##1       | 6629/31509 [00:11<00:36, 674.27it/s]","\rparsing log, completed traces ::  21%|##1       | 6697/31509 [00:12<01:31, 270.76it/s]","\rparsing log, completed traces ::  21%|##1       | 6768/31509 [00:12<01:14, 332.20it/s]","\rparsing log, completed traces ::  22%|##1       | 6834/31509 [00:12<01:03, 386.98it/s]","\rparsing log, completed traces ::  22%|##1       | 6905/31509 [00:12<00:54, 448.85it/s]","\rparsing log, completed traces ::  22%|##2       | 6973/31509 [00:12<00:49, 498.50it/s]","\rparsing log, completed traces ::  22%|##2       | 7052/31509 [00:12<00:43, 566.36it/s]","\rparsing log, completed traces ::  23%|##2       | 7125/31509 [00:12<00:40, 607.14it/s]","\rparsing log, completed traces ::  23%|##2       | 7195/31509 [00:12<00:39, 615.49it/s]","\rparsing log, completed traces ::  23%|##3       | 7264/31509 [00:12<00:38, 633.07it/s]","\rparsing log, completed traces ::  23%|##3       | 7332/31509 [00:13<00:37, 639.96it/s]","\rparsing log, completed traces ::  23%|##3       | 7400/31509 [00:13<00:37, 648.83it/s]","\rparsing log, completed traces ::  24%|##3       | 7471/31509 [00:13<00:36, 665.44it/s]","\rparsing log, completed traces ::  24%|##3       | 7549/31509 [00:13<00:34, 697.04it/s]","\rparsing log, completed traces ::  24%|##4       | 7621/31509 [00:13<00:34, 690.83it/s]","\rparsing log, completed traces ::  24%|##4       | 7692/31509 [00:13<00:34, 684.15it/s]","\rparsing log, completed traces ::  25%|##4       | 7762/31509 [00:13<00:35, 674.58it/s]","\rparsing log, completed traces ::  25%|##4       | 7830/31509 [00:13<00:35, 674.11it/s]","\rparsing log, completed traces ::  25%|##5       | 7902/31509 [00:13<00:34, 686.33it/s]","\rparsing log, completed traces ::  25%|##5       | 7972/31509 [00:14<00:34, 687.77it/s]","\rparsing log, completed traces ::  26%|##5       | 8043/31509 [00:14<00:33, 692.51it/s]","\rparsing log, completed traces ::  26%|##5       | 8113/31509 [00:14<00:33, 689.02it/s]","\rparsing log, completed traces ::  26%|##5       | 8186/31509 [00:14<00:33, 700.71it/s]","\rparsing log, completed traces ::  26%|##6       | 8257/31509 [00:14<00:33, 696.24it/s]","\rparsing log, completed traces ::  26%|##6       | 8332/31509 [00:14<00:32, 709.23it/s]","\rparsing log, completed traces ::  27%|##6       | 8403/31509 [00:14<00:33, 690.22it/s]","\rparsing log, completed traces ::  27%|##6       | 8475/31509 [00:14<00:33, 697.39it/s]","\rparsing log, completed traces ::  27%|##7       | 8545/31509 [00:14<00:33, 678.91it/s]","\rparsing log, completed traces ::  27%|##7       | 8616/31509 [00:14<00:33, 683.10it/s]","\rparsing log, completed traces ::  28%|##7       | 8685/31509 [00:15<00:33, 681.39it/s]","\rparsing log, completed traces ::  28%|##7       | 8757/31509 [00:15<00:32, 690.66it/s]","\rparsing log, completed traces ::  28%|##8       | 8827/31509 [00:15<01:30, 249.90it/s]","\rparsing log, completed traces ::  28%|##8       | 8893/31509 [00:15<01:14, 303.34it/s]","\rparsing log, completed traces ::  28%|##8       | 8962/31509 [00:16<01:01, 363.92it/s]","\rparsing log, completed traces ::  29%|##8       | 9023/31509 [00:16<00:55, 408.83it/s]","\rparsing log, completed traces ::  29%|##8       | 9090/31509 [00:16<00:48, 462.87it/s]","\rparsing log, completed traces ::  29%|##9       | 9158/31509 [00:16<00:43, 511.31it/s]","\rparsing log, completed traces ::  29%|##9       | 9222/31509 [00:16<00:41, 539.34it/s]","\rparsing log, completed traces ::  29%|##9       | 9287/31509 [00:16<00:39, 566.67it/s]","\rparsing log, completed traces ::  30%|##9       | 9361/31509 [00:16<00:36, 612.39it/s]","\rparsing log, completed traces ::  30%|##9       | 9428/31509 [00:16<00:35, 615.22it/s]","\rparsing log, completed traces ::  30%|###       | 9494/31509 [00:16<00:35, 619.65it/s]","\rparsing log, completed traces ::  30%|###       | 9563/31509 [00:16<00:34, 639.04it/s]","\rparsing log, completed traces ::  31%|###       | 9631/31509 [00:17<00:33, 647.89it/s]","\rparsing log, completed traces ::  31%|###       | 9698/31509 [00:17<00:34, 637.10it/s]","\rparsing log, completed traces ::  31%|###       | 9764/31509 [00:17<00:33, 641.87it/s]","\rparsing log, completed traces ::  31%|###1      | 9830/31509 [00:17<00:33, 646.86it/s]","\rparsing log, completed traces ::  31%|###1      | 9896/31509 [00:17<00:33, 641.84it/s]","\rparsing log, completed traces ::  32%|###1      | 9963/31509 [00:17<00:33, 649.71it/s]","\rparsing log, completed traces ::  32%|###1      | 10029/31509 [00:17<00:33, 641.44it/s]","\rparsing log, completed traces ::  32%|###2      | 10094/31509 [00:17<00:34, 625.08it/s]","\rparsing log, completed traces ::  32%|###2      | 10159/31509 [00:17<00:33, 631.37it/s]","\rparsing log, completed traces ::  32%|###2      | 10227/31509 [00:18<00:32, 645.52it/s]","\rparsing log, completed traces ::  33%|###2      | 10294/31509 [00:18<00:32, 652.62it/s]","\rparsing log, completed traces ::  33%|###2      | 10360/31509 [00:18<00:33, 623.87it/s]","\rparsing log, completed traces ::  33%|###3      | 10427/31509 [00:18<00:33, 636.49it/s]","\rparsing log, completed traces ::  33%|###3      | 10491/31509 [00:18<00:33, 630.87it/s]","\rparsing log, completed traces ::  34%|###3      | 10556/31509 [00:18<00:32, 635.29it/s]","\rparsing log, completed traces ::  34%|###3      | 10620/31509 [00:18<00:33, 631.50it/s]","\rparsing log, completed traces ::  34%|###3      | 10685/31509 [00:18<00:32, 635.18it/s]","\rparsing log, completed traces ::  34%|###4      | 10749/31509 [00:18<00:33, 628.94it/s]","\rparsing log, completed traces ::  34%|###4      | 10812/31509 [00:18<00:33, 616.24it/s]","\rparsing log, completed traces ::  35%|###4      | 10874/31509 [00:19<00:34, 604.38it/s]","\rparsing log, completed traces ::  35%|###4      | 10936/31509 [00:19<00:33, 608.86it/s]","\rparsing log, completed traces ::  35%|###4      | 11001/31509 [00:19<00:33, 619.73it/s]","\rparsing log, completed traces ::  35%|###5      | 11069/31509 [00:19<00:32, 636.98it/s]","\rparsing log, completed traces ::  35%|###5      | 11133/31509 [00:20<01:29, 226.91it/s]","\rparsing log, completed traces ::  36%|###5      | 11195/31509 [00:20<01:13, 278.02it/s]","\rparsing log, completed traces ::  36%|###5      | 11265/31509 [00:20<00:58, 344.01it/s]","\rparsing log, completed traces ::  36%|###5      | 11336/31509 [00:20<00:49, 409.57it/s]","\rparsing log, completed traces ::  36%|###6      | 11398/31509 [00:20<00:44, 451.98it/s]","\rparsing log, completed traces ::  36%|###6      | 11461/31509 [00:20<00:40, 491.30it/s]","\rparsing log, completed traces ::  37%|###6      | 11523/31509 [00:20<00:38, 522.03it/s]","\rparsing log, completed traces ::  37%|###6      | 11591/31509 [00:20<00:35, 561.41it/s]","\rparsing log, completed traces ::  37%|###6      | 11656/31509 [00:20<00:34, 583.06it/s]","\rparsing log, completed traces ::  37%|###7      | 11720/31509 [00:20<00:33, 597.90it/s]","\rparsing log, completed traces ::  37%|###7      | 11790/31509 [00:21<00:31, 625.92it/s]","\rparsing log, completed traces ::  38%|###7      | 11857/31509 [00:21<00:30, 638.41it/s]","\rparsing log, completed traces ::  38%|###7      | 11930/31509 [00:21<00:29, 664.09it/s]","\rparsing log, completed traces ::  38%|###8      | 11998/31509 [00:21<00:29, 664.00it/s]","\rparsing log, completed traces ::  38%|###8      | 12067/31509 [00:21<00:29, 667.83it/s]","\rparsing log, completed traces ::  39%|###8      | 12136/31509 [00:21<00:28, 673.30it/s]","\rparsing log, completed traces ::  39%|###8      | 12204/31509 [00:21<00:28, 670.84it/s]","\rparsing log, completed traces ::  39%|###8      | 12272/31509 [00:21<00:28, 668.53it/s]","\rparsing log, completed traces ::  39%|###9      | 12342/31509 [00:21<00:28, 676.65it/s]","\rparsing log, completed traces ::  39%|###9      | 12410/31509 [00:21<00:28, 672.77it/s]","\rparsing log, completed traces ::  40%|###9      | 12478/31509 [00:22<00:28, 672.41it/s]","\rparsing log, completed traces ::  40%|###9      | 12546/31509 [00:22<00:28, 657.31it/s]","\rparsing log, completed traces ::  40%|####      | 12614/31509 [00:22<00:28, 662.31it/s]","\rparsing log, completed traces ::  40%|####      | 12682/31509 [00:22<00:28, 664.83it/s]","\rparsing log, completed traces ::  40%|####      | 12754/31509 [00:22<00:27, 678.18it/s]","\rparsing log, completed traces ::  41%|####      | 12822/31509 [00:22<00:27, 673.80it/s]","\rparsing log, completed traces ::  41%|####      | 12890/31509 [00:22<00:28, 660.79it/s]","\rparsing log, completed traces ::  41%|####1     | 12957/31509 [00:22<00:28, 655.05it/s]","\rparsing log, completed traces ::  41%|####1     | 13026/31509 [00:22<00:27, 662.79it/s]","\rparsing log, completed traces ::  42%|####1     | 13103/31509 [00:23<00:26, 692.25it/s]","\rparsing log, completed traces ::  42%|####1     | 13173/31509 [00:23<00:27, 676.71it/s]","\rparsing log, completed traces ::  42%|####2     | 13241/31509 [00:23<00:27, 663.30it/s]","\rparsing log, completed traces ::  42%|####2     | 13309/31509 [00:23<00:27, 664.88it/s]","\rparsing log, completed traces ::  42%|####2     | 13378/31509 [00:23<00:27, 670.25it/s]","\rparsing log, completed traces ::  43%|####2     | 13446/31509 [00:23<00:27, 661.87it/s]","\rparsing log, completed traces ::  43%|####2     | 13514/31509 [00:23<00:26, 667.04it/s]","\rparsing log, completed traces ::  43%|####3     | 13581/31509 [00:23<00:27, 660.43it/s]","\rparsing log, completed traces ::  43%|####3     | 13648/31509 [00:23<00:27, 651.15it/s]","\rparsing log, completed traces ::  44%|####3     | 13714/31509 [00:23<00:27, 653.23it/s]","\rparsing log, completed traces ::  44%|####3     | 13780/31509 [00:24<01:24, 208.74it/s]","\rparsing log, completed traces ::  44%|####3     | 13847/31509 [00:24<01:07, 263.03it/s]","\rparsing log, completed traces ::  44%|####4     | 13909/31509 [00:24<00:55, 314.50it/s]","\rparsing log, completed traces ::  44%|####4     | 13977/31509 [00:25<00:46, 375.78it/s]","\rparsing log, completed traces ::  45%|####4     | 14050/31509 [00:25<00:39, 444.16it/s]","\rparsing log, completed traces ::  45%|####4     | 14117/31509 [00:25<00:35, 493.25it/s]","\rparsing log, completed traces ::  45%|####5     | 14185/31509 [00:25<00:32, 536.85it/s]","\rparsing log, completed traces ::  45%|####5     | 14254/31509 [00:25<00:30, 574.20it/s]","\rparsing log, completed traces ::  45%|####5     | 14325/31509 [00:25<00:28, 605.03it/s]","\rparsing log, completed traces ::  46%|####5     | 14400/31509 [00:25<00:26, 643.53it/s]","\rparsing log, completed traces ::  46%|####5     | 14470/31509 [00:25<00:26, 655.34it/s]","\rparsing log, completed traces ::  46%|####6     | 14540/31509 [00:25<00:26, 644.93it/s]","\rparsing log, completed traces ::  46%|####6     | 14607/31509 [00:26<00:26, 647.03it/s]","\rparsing log, completed traces ::  47%|####6     | 14674/31509 [00:26<00:25, 652.64it/s]","\rparsing log, completed traces ::  47%|####6     | 14742/31509 [00:26<00:25, 660.09it/s]","\rparsing log, completed traces ::  47%|####7     | 14815/31509 [00:26<00:24, 680.35it/s]","\rparsing log, completed traces ::  47%|####7     | 14884/31509 [00:26<00:24, 671.30it/s]","\rparsing log, completed traces ::  47%|####7     | 14960/31509 [00:26<00:23, 696.48it/s]","\rparsing log, completed traces ::  48%|####7     | 15031/31509 [00:26<00:24, 678.24it/s]","\rparsing log, completed traces ::  48%|####7     | 15107/31509 [00:26<00:23, 697.41it/s]","\rparsing log, completed traces ::  48%|####8     | 15178/31509 [00:26<00:23, 700.51it/s]","\rparsing log, completed traces ::  48%|####8     | 15249/31509 [00:26<00:23, 698.17it/s]","\rparsing log, completed traces ::  49%|####8     | 15324/31509 [00:27<00:22, 713.20it/s]","\rparsing log, completed traces ::  49%|####8     | 15396/31509 [00:27<00:22, 714.61it/s]","\rparsing log, completed traces ::  49%|####9     | 15468/31509 [00:27<00:22, 713.99it/s]","\rparsing log, completed traces ::  49%|####9     | 15540/31509 [00:27<00:22, 713.06it/s]","\rparsing log, completed traces ::  50%|####9     | 15614/31509 [00:27<00:22, 719.46it/s]","\rparsing log, completed traces ::  50%|####9     | 15687/31509 [00:27<00:21, 721.88it/s]","\rparsing log, completed traces ::  50%|#####     | 15760/31509 [00:27<00:22, 710.80it/s]","\rparsing log, completed traces ::  50%|#####     | 15832/31509 [00:27<00:22, 699.35it/s]","\rparsing log, completed traces ::  50%|#####     | 15906/31509 [00:27<00:21, 709.53it/s]","\rparsing log, completed traces ::  51%|#####     | 15978/31509 [00:27<00:21, 709.33it/s]","\rparsing log, completed traces ::  51%|#####     | 16049/31509 [00:28<00:21, 704.42it/s]","\rparsing log, completed traces ::  51%|#####1    | 16123/31509 [00:28<00:21, 714.19it/s]","\rparsing log, completed traces ::  51%|#####1    | 16200/31509 [00:28<00:21, 728.73it/s]","\rparsing log, completed traces ::  52%|#####1    | 16273/31509 [00:28<00:21, 720.57it/s]","\rparsing log, completed traces ::  52%|#####1    | 16346/31509 [00:28<00:21, 713.38it/s]","\rparsing log, completed traces ::  52%|#####2    | 16418/31509 [00:28<00:21, 691.26it/s]","\rparsing log, completed traces ::  52%|#####2    | 16488/31509 [00:28<00:21, 686.71it/s]","\rparsing log, completed traces ::  53%|#####2    | 16557/31509 [00:28<00:21, 682.43it/s]","\rparsing log, completed traces ::  53%|#####2    | 16628/31509 [00:28<00:21, 685.69it/s]","\rparsing log, completed traces ::  53%|#####3    | 16703/31509 [00:28<00:21, 704.41it/s]","\rparsing log, completed traces ::  53%|#####3    | 16774/31509 [00:29<00:21, 690.80it/s]","\rparsing log, completed traces ::  53%|#####3    | 16844/31509 [00:29<00:21, 692.71it/s]","\rparsing log, completed traces ::  54%|#####3    | 16914/31509 [00:30<01:09, 209.18it/s]","\rparsing log, completed traces ::  54%|#####3    | 16983/31509 [00:30<00:55, 262.93it/s]","\rparsing log, completed traces ::  54%|#####4    | 17063/31509 [00:30<00:42, 336.87it/s]","\rparsing log, completed traces ::  54%|#####4    | 17127/31509 [00:30<00:37, 386.76it/s]","\rparsing log, completed traces ::  55%|#####4    | 17197/31509 [00:30<00:32, 445.92it/s]","\rparsing log, completed traces ::  55%|#####4    | 17265/31509 [00:30<00:28, 494.71it/s]","\rparsing log, completed traces ::  55%|#####5    | 17336/31509 [00:30<00:26, 544.50it/s]","\rparsing log, completed traces ::  55%|#####5    | 17407/31509 [00:30<00:24, 584.48it/s]","\rparsing log, completed traces ::  55%|#####5    | 17476/31509 [00:30<00:23, 609.65it/s]","\rparsing log, completed traces ::  56%|#####5    | 17545/31509 [00:31<00:22, 618.93it/s]","\rparsing log, completed traces ::  56%|#####5    | 17620/31509 [00:31<00:21, 652.06it/s]","\rparsing log, completed traces ::  56%|#####6    | 17691/31509 [00:31<00:20, 667.43it/s]","\rparsing log, completed traces ::  56%|#####6    | 17761/31509 [00:31<00:20, 674.19it/s]","\rparsing log, completed traces ::  57%|#####6    | 17831/31509 [00:31<00:20, 680.64it/s]","\rparsing log, completed traces ::  57%|#####6    | 17904/31509 [00:31<00:19, 693.42it/s]","\rparsing log, completed traces ::  57%|#####7    | 17975/31509 [00:31<00:19, 690.77it/s]","\rparsing log, completed traces ::  57%|#####7    | 18049/31509 [00:31<00:19, 704.97it/s]","\rparsing log, completed traces ::  58%|#####7    | 18121/31509 [00:31<00:18, 705.23it/s]","\rparsing log, completed traces ::  58%|#####7    | 18196/31509 [00:31<00:18, 716.18it/s]","\rparsing log, completed traces ::  58%|#####7    | 18268/31509 [00:32<00:18, 708.00it/s]","\rparsing log, completed traces ::  58%|#####8    | 18339/31509 [00:32<00:18, 696.86it/s]","\rparsing log, completed traces ::  58%|#####8    | 18410/31509 [00:32<00:18, 698.01it/s]","\rparsing log, completed traces ::  59%|#####8    | 18483/31509 [00:32<00:18, 701.92it/s]","\rparsing log, completed traces ::  59%|#####8    | 18554/31509 [00:32<00:19, 679.71it/s]","\rparsing log, completed traces ::  59%|#####9    | 18623/31509 [00:32<00:18, 682.06it/s]","\rparsing log, completed traces ::  59%|#####9    | 18706/31509 [00:32<00:17, 724.86it/s]","\rparsing log, completed traces ::  60%|#####9    | 18779/31509 [00:32<00:17, 712.98it/s]","\rparsing log, completed traces ::  60%|#####9    | 18851/31509 [00:32<00:17, 706.20it/s]","\rparsing log, completed traces ::  60%|######    | 18932/31509 [00:32<00:17, 734.08it/s]","\rparsing log, completed traces ::  60%|######    | 19006/31509 [00:33<00:17, 726.19it/s]","\rparsing log, completed traces ::  61%|######    | 19079/31509 [00:33<00:17, 721.81it/s]","\rparsing log, completed traces ::  61%|######    | 19155/31509 [00:33<00:16, 732.80it/s]","\rparsing log, completed traces ::  61%|######1   | 19229/31509 [00:33<00:17, 706.12it/s]","\rparsing log, completed traces ::  61%|######1   | 19303/31509 [00:33<00:17, 714.15it/s]","\rparsing log, completed traces ::  61%|######1   | 19377/31509 [00:33<00:16, 720.90it/s]","\rparsing log, completed traces ::  62%|######1   | 19452/31509 [00:33<00:16, 728.38it/s]","\rparsing log, completed traces ::  62%|######1   | 19525/31509 [00:33<00:16, 719.30it/s]","\rparsing log, completed traces ::  62%|######2   | 19598/31509 [00:33<00:16, 719.49it/s]","\rparsing log, completed traces ::  62%|######2   | 19671/31509 [00:33<00:16, 714.73it/s]","\rparsing log, completed traces ::  63%|######2   | 19743/31509 [00:34<00:16, 712.51it/s]","\rparsing log, completed traces ::  63%|######2   | 19815/31509 [00:34<00:16, 699.53it/s]","\rparsing log, completed traces ::  63%|######3   | 19886/31509 [00:34<00:16, 692.65it/s]","\rparsing log, completed traces ::  63%|######3   | 19956/31509 [00:34<00:16, 692.21it/s]","\rparsing log, completed traces ::  64%|######3   | 20026/31509 [00:34<00:16, 688.59it/s]","\rparsing log, completed traces ::  64%|######3   | 20095/31509 [00:34<00:16, 685.05it/s]","\rparsing log, completed traces ::  64%|######4   | 20166/31509 [00:34<00:16, 692.09it/s]","\rparsing log, completed traces ::  64%|######4   | 20240/31509 [00:34<00:15, 704.96it/s]","\rparsing log, completed traces ::  64%|######4   | 20314/31509 [00:34<00:15, 712.45it/s]","\rparsing log, completed traces ::  65%|######4   | 20386/31509 [00:35<00:15, 714.18it/s]","\rparsing log, completed traces ::  65%|######4   | 20462/31509 [00:35<00:54, 204.12it/s]","\rparsing log, completed traces ::  65%|######5   | 20535/31509 [00:36<00:42, 259.71it/s]","\rparsing log, completed traces ::  65%|######5   | 20611/31509 [00:36<00:33, 324.93it/s]","\rparsing log, completed traces ::  66%|######5   | 20688/31509 [00:36<00:27, 394.70it/s]","\rparsing log, completed traces ::  66%|######5   | 20766/31509 [00:36<00:23, 464.37it/s]","\rparsing log, completed traces ::  66%|######6   | 20837/31509 [00:36<00:20, 508.85it/s]","\rparsing log, completed traces ::  66%|######6   | 20909/31509 [00:36<00:19, 556.68it/s]","\rparsing log, completed traces ::  67%|######6   | 20979/31509 [00:36<00:17, 585.48it/s]","\rparsing log, completed traces ::  67%|######6   | 21049/31509 [00:36<00:17, 610.03it/s]","\rparsing log, completed traces ::  67%|######7   | 21118/31509 [00:36<00:16, 627.23it/s]","\rparsing log, completed traces ::  67%|######7   | 21189/31509 [00:36<00:15, 647.54it/s]","\rparsing log, completed traces ::  67%|######7   | 21265/31509 [00:37<00:15, 677.67it/s]","\rparsing log, completed traces ::  68%|######7   | 21336/31509 [00:37<00:14, 682.06it/s]","\rparsing log, completed traces ::  68%|######7   | 21407/31509 [00:37<00:14, 686.30it/s]","\rparsing log, completed traces ::  68%|######8   | 21483/31509 [00:37<00:14, 707.10it/s]","\rparsing log, completed traces ::  68%|######8   | 21560/31509 [00:37<00:13, 725.07it/s]","\rparsing log, completed traces ::  69%|######8   | 21634/31509 [00:37<00:13, 722.15it/s]","\rparsing log, completed traces ::  69%|######8   | 21707/31509 [00:37<00:13, 713.68it/s]","\rparsing log, completed traces ::  69%|######9   | 21786/31509 [00:37<00:13, 733.63it/s]","\rparsing log, completed traces ::  69%|######9   | 21864/31509 [00:37<00:12, 747.25it/s]","\rparsing log, completed traces ::  70%|######9   | 21939/31509 [00:38<00:12, 744.21it/s]","\rparsing log, completed traces ::  70%|######9   | 22014/31509 [00:38<00:12, 739.22it/s]","\rparsing log, completed traces ::  70%|#######   | 22090/31509 [00:38<00:12, 741.24it/s]","\rparsing log, completed traces ::  70%|#######   | 22171/31509 [00:38<00:12, 757.61it/s]","\rparsing log, completed traces ::  71%|#######   | 22247/31509 [00:38<00:12, 735.76it/s]","\rparsing log, completed traces ::  71%|#######   | 22321/31509 [00:38<00:12, 735.49it/s]","\rparsing log, completed traces ::  71%|#######1  | 22395/31509 [00:38<00:12, 730.03it/s]","\rparsing log, completed traces ::  71%|#######1  | 22474/31509 [00:38<00:12, 746.57it/s]","\rparsing log, completed traces ::  72%|#######1  | 22549/31509 [00:38<00:12, 732.85it/s]","\rparsing log, completed traces ::  72%|#######1  | 22623/31509 [00:38<00:12, 734.57it/s]","\rparsing log, completed traces ::  72%|#######2  | 22697/31509 [00:39<00:12, 723.80it/s]","\rparsing log, completed traces ::  72%|#######2  | 22774/31509 [00:39<00:11, 733.64it/s]","\rparsing log, completed traces ::  73%|#######2  | 22849/31509 [00:39<00:11, 736.25it/s]","\rparsing log, completed traces ::  73%|#######2  | 22923/31509 [00:39<00:11, 715.55it/s]","\rparsing log, completed traces ::  73%|#######2  | 22995/31509 [00:39<00:11, 712.24it/s]","\rparsing log, completed traces ::  73%|#######3  | 23067/31509 [00:39<00:11, 708.53it/s]","\rparsing log, completed traces ::  73%|#######3  | 23138/31509 [00:39<00:11, 704.39it/s]","\rparsing log, completed traces ::  74%|#######3  | 23209/31509 [00:39<00:11, 698.22it/s]","\rparsing log, completed traces ::  74%|#######3  | 23279/31509 [00:39<00:11, 696.01it/s]","\rparsing log, completed traces ::  74%|#######4  | 23349/31509 [00:39<00:11, 689.44it/s]","\rparsing log, completed traces ::  74%|#######4  | 23418/31509 [00:40<00:11, 688.59it/s]","\rparsing log, completed traces ::  75%|#######4  | 23487/31509 [00:40<00:11, 688.18it/s]","\rparsing log, completed traces ::  75%|#######4  | 23560/31509 [00:40<00:11, 699.52it/s]","\rparsing log, completed traces ::  75%|#######5  | 23634/31509 [00:40<00:11, 706.68it/s]","\rparsing log, completed traces ::  75%|#######5  | 23705/31509 [00:40<00:11, 706.63it/s]","\rparsing log, completed traces ::  75%|#######5  | 23777/31509 [00:40<00:10, 708.90it/s]","\rparsing log, completed traces ::  76%|#######5  | 23848/31509 [00:40<00:10, 708.41it/s]","\rparsing log, completed traces ::  76%|#######5  | 23919/31509 [00:40<00:10, 706.45it/s]","\rparsing log, completed traces ::  76%|#######6  | 23991/31509 [00:40<00:10, 709.68it/s]","\rparsing log, completed traces ::  76%|#######6  | 24062/31509 [00:40<00:10, 703.98it/s]","\rparsing log, completed traces ::  77%|#######6  | 24135/31509 [00:41<00:10, 709.14it/s]","\rparsing log, completed traces ::  77%|#######6  | 24206/31509 [00:41<00:10, 703.74it/s]","\rparsing log, completed traces ::  77%|#######7  | 24278/31509 [00:41<00:10, 707.42it/s]","\rparsing log, completed traces ::  77%|#######7  | 24355/31509 [00:41<00:09, 725.15it/s]","\rparsing log, completed traces ::  78%|#######7  | 24428/31509 [00:41<00:10, 701.55it/s]","\rparsing log, completed traces ::  78%|#######7  | 24504/31509 [00:41<00:09, 717.53it/s]","\rparsing log, completed traces ::  78%|#######7  | 24576/31509 [00:42<00:37, 184.77it/s]","\rparsing log, completed traces ::  78%|#######8  | 24653/31509 [00:42<00:28, 241.65it/s]","\rparsing log, completed traces ::  78%|#######8  | 24724/31509 [00:42<00:22, 298.73it/s]","\rparsing log, completed traces ::  79%|#######8  | 24795/31509 [00:42<00:18, 358.58it/s]","\rparsing log, completed traces ::  79%|#######8  | 24869/31509 [00:43<00:15, 423.93it/s]","\rparsing log, completed traces ::  79%|#######9  | 24941/31509 [00:43<00:13, 482.41it/s]","\rparsing log, completed traces ::  79%|#######9  | 25020/31509 [00:43<00:11, 550.12it/s]","\rparsing log, completed traces ::  80%|#######9  | 25092/31509 [00:43<00:11, 574.49it/s]","\rparsing log, completed traces ::  80%|#######9  | 25167/31509 [00:43<00:10, 617.63it/s]","\rparsing log, completed traces ::  80%|########  | 25239/31509 [00:43<00:09, 638.63it/s]","\rparsing log, completed traces ::  80%|########  | 25310/31509 [00:43<00:09, 639.63it/s]","\rparsing log, completed traces ::  81%|########  | 25385/31509 [00:43<00:09, 668.93it/s]","\rparsing log, completed traces ::  81%|########  | 25457/31509 [00:43<00:08, 683.16it/s]","\rparsing log, completed traces ::  81%|########1 | 25528/31509 [00:44<00:08, 690.54it/s]","\rparsing log, completed traces ::  81%|########1 | 25601/31509 [00:44<00:08, 699.98it/s]","\rparsing log, completed traces ::  81%|########1 | 25673/31509 [00:44<00:08, 692.85it/s]","\rparsing log, completed traces ::  82%|########1 | 25745/31509 [00:44<00:08, 695.51it/s]","\rparsing log, completed traces ::  82%|########1 | 25816/31509 [00:44<00:08, 684.85it/s]","\rparsing log, completed traces ::  82%|########2 | 25887/31509 [00:44<00:08, 690.93it/s]","\rparsing log, completed traces ::  82%|########2 | 25957/31509 [00:44<00:08, 692.08it/s]","\rparsing log, completed traces ::  83%|########2 | 26027/31509 [00:44<00:07, 685.54it/s]","\rparsing log, completed traces ::  83%|########2 | 26096/31509 [00:44<00:07, 677.98it/s]","\rparsing log, completed traces ::  83%|########3 | 26169/31509 [00:44<00:07, 691.93it/s]","\rparsing log, completed traces ::  83%|########3 | 26240/31509 [00:45<00:07, 695.63it/s]","\rparsing log, completed traces ::  84%|########3 | 26312/31509 [00:45<00:07, 702.22it/s]","\rparsing log, completed traces ::  84%|########3 | 26385/31509 [00:45<00:07, 708.99it/s]","\rparsing log, completed traces ::  84%|########3 | 26456/31509 [00:45<00:07, 702.15it/s]","\rparsing log, completed traces ::  84%|########4 | 26527/31509 [00:45<00:07, 694.29it/s]","\rparsing log, completed traces ::  84%|########4 | 26597/31509 [00:45<00:07, 675.13it/s]","\rparsing log, completed traces ::  85%|########4 | 26665/31509 [00:45<00:07, 674.16it/s]","\rparsing log, completed traces ::  85%|########4 | 26740/31509 [00:45<00:06, 695.31it/s]","\rparsing log, completed traces ::  85%|########5 | 26810/31509 [00:45<00:06, 680.94it/s]","\rparsing log, completed traces ::  85%|########5 | 26879/31509 [00:45<00:06, 678.76it/s]","\rparsing log, completed traces ::  86%|########5 | 26950/31509 [00:46<00:06, 687.12it/s]","\rparsing log, completed traces ::  86%|########5 | 27019/31509 [00:46<00:06, 673.04it/s]","\rparsing log, completed traces ::  86%|########5 | 27087/31509 [00:46<00:06, 670.56it/s]","\rparsing log, completed traces ::  86%|########6 | 27160/31509 [00:46<00:06, 687.10it/s]","\rparsing log, completed traces ::  86%|########6 | 27233/31509 [00:46<00:06, 697.42it/s]","\rparsing log, completed traces ::  87%|########6 | 27303/31509 [00:46<00:06, 695.22it/s]","\rparsing log, completed traces ::  87%|########6 | 27373/31509 [00:46<00:05, 691.40it/s]","\rparsing log, completed traces ::  87%|########7 | 27443/31509 [00:46<00:05, 692.97it/s]","\rparsing log, completed traces ::  87%|########7 | 27513/31509 [00:46<00:05, 689.35it/s]","\rparsing log, completed traces ::  88%|########7 | 27587/31509 [00:46<00:05, 700.79it/s]","\rparsing log, completed traces ::  88%|########7 | 27661/31509 [00:47<00:05, 711.00it/s]","\rparsing log, completed traces ::  88%|########8 | 27738/31509 [00:47<00:05, 727.28it/s]","\rparsing log, completed traces ::  88%|########8 | 27811/31509 [00:47<00:05, 710.60it/s]","\rparsing log, completed traces ::  88%|########8 | 27883/31509 [00:47<00:05, 705.14it/s]","\rparsing log, completed traces ::  89%|########8 | 27954/31509 [00:47<00:05, 701.34it/s]","\rparsing log, completed traces ::  89%|########8 | 28025/31509 [00:47<00:04, 700.25it/s]","\rparsing log, completed traces ::  89%|########9 | 28096/31509 [00:47<00:04, 687.90it/s]","\rparsing log, completed traces ::  89%|########9 | 28165/31509 [00:47<00:04, 680.21it/s]","\rparsing log, completed traces ::  90%|########9 | 28239/31509 [00:47<00:04, 695.02it/s]","\rparsing log, completed traces ::  90%|########9 | 28309/31509 [00:48<00:04, 685.75it/s]","\rparsing log, completed traces ::  90%|######### | 28382/31509 [00:48<00:04, 698.02it/s]","\rparsing log, completed traces ::  90%|######### | 28452/31509 [00:48<00:04, 684.64it/s]","\rparsing log, completed traces ::  91%|######### | 28526/31509 [00:48<00:04, 700.41it/s]","\rparsing log, completed traces ::  91%|######### | 28601/31509 [00:48<00:04, 714.28it/s]","\rparsing log, completed traces ::  91%|######### | 28673/31509 [00:48<00:04, 702.50it/s]","\rparsing log, completed traces ::  91%|#########1| 28744/31509 [00:48<00:04, 667.51it/s]","\rparsing log, completed traces ::  91%|#########1| 28812/31509 [00:48<00:04, 666.17it/s]","\rparsing log, completed traces ::  92%|#########1| 28879/31509 [00:48<00:04, 646.55it/s]","\rparsing log, completed traces ::  92%|#########1| 28948/31509 [00:50<00:16, 155.88it/s]","\rparsing log, completed traces ::  92%|#########2| 29017/31509 [00:50<00:12, 202.58it/s]","\rparsing log, completed traces ::  92%|#########2| 29083/31509 [00:50<00:09, 252.99it/s]","\rparsing log, completed traces ::  93%|#########2| 29150/31509 [00:50<00:07, 310.05it/s]","\rparsing log, completed traces ::  93%|#########2| 29223/31509 [00:50<00:06, 378.18it/s]","\rparsing log, completed traces ::  93%|#########2| 29293/31509 [00:50<00:05, 438.06it/s]","\rparsing log, completed traces ::  93%|#########3| 29359/31509 [00:50<00:04, 484.42it/s]","\rparsing log, completed traces ::  93%|#########3| 29425/31509 [00:50<00:03, 523.29it/s]","\rparsing log, completed traces ::  94%|#########3| 29491/31509 [00:50<00:03, 549.27it/s]","\rparsing log, completed traces ::  94%|#########3| 29556/31509 [00:51<00:03, 561.80it/s]","\rparsing log, completed traces ::  94%|#########4| 29631/31509 [00:51<00:03, 611.04it/s]","\rparsing log, completed traces ::  94%|#########4| 29701/31509 [00:51<00:02, 634.93it/s]","\rparsing log, completed traces ::  94%|#########4| 29769/31509 [00:51<00:02, 647.39it/s]","\rparsing log, completed traces ::  95%|#########4| 29837/31509 [00:51<00:02, 650.25it/s]","\rparsing log, completed traces ::  95%|#########4| 29907/31509 [00:51<00:02, 663.17it/s]","\rparsing log, completed traces ::  95%|#########5| 29977/31509 [00:51<00:02, 672.04it/s]","\rparsing log, completed traces ::  95%|#########5| 30046/31509 [00:51<00:02, 672.77it/s]","\rparsing log, completed traces ::  96%|#########5| 30116/31509 [00:51<00:02, 680.02it/s]","\rparsing log, completed traces ::  96%|#########5| 30185/31509 [00:51<00:01, 680.04it/s]","\rparsing log, completed traces ::  96%|#########6| 30258/31509 [00:52<00:01, 692.55it/s]","\rparsing log, completed traces ::  96%|#########6| 30331/31509 [00:52<00:01, 701.09it/s]","\rparsing log, completed traces ::  96%|#########6| 30405/31509 [00:52<00:01, 711.29it/s]","\rparsing log, completed traces ::  97%|#########6| 30477/31509 [00:52<00:01, 697.93it/s]","\rparsing log, completed traces ::  97%|#########6| 30547/31509 [00:52<00:01, 697.38it/s]","\rparsing log, completed traces ::  97%|#########7| 30623/31509 [00:52<00:01, 715.60it/s]","\rparsing log, completed traces ::  97%|#########7| 30695/31509 [00:52<00:01, 710.26it/s]","\rparsing log, completed traces ::  98%|#########7| 30767/31509 [00:52<00:01, 709.22it/s]","\rparsing log, completed traces ::  98%|#########7| 30840/31509 [00:52<00:00, 713.87it/s]","\rparsing log, completed traces ::  98%|#########8| 30912/31509 [00:52<00:00, 699.70it/s]","\rparsing log, completed traces ::  98%|#########8| 30983/31509 [00:53<00:00, 696.44it/s]","\rparsing log, completed traces ::  99%|#########8| 31057/31509 [00:53<00:00, 707.15it/s]","\rparsing log, completed traces ::  99%|#########8| 31129/31509 [00:53<00:00, 709.80it/s]","\rparsing log, completed traces ::  99%|#########9| 31206/31509 [00:53<00:00, 726.76it/s]","\rparsing log, completed traces ::  99%|#########9| 31279/31509 [00:53<00:00, 685.20it/s]","\rparsing log, completed traces ::  99%|#########9| 31349/31509 [00:53<00:00, 672.31it/s]","\rparsing log, completed traces :: 100%|#########9| 31421/31509 [00:53<00:00, 684.36it/s]","\rparsing log, completed traces :: 100%|#########9| 31490/31509 [00:53<00:00, 677.18it/s]","","\rparsing log, completed traces :: 100%|##########| 31509/31509 [00:53<00:00, 585.20it/s]","\n","[data] Loading XES: /workspace/data/Road_Traffic_Fine_Management_Process.xes","\n","\rparsing log, completed traces ::   0%|          | 0/150370 [00:00<?, ?it/s]","\rparsing log, completed traces ::   1%|          | 766/150370 [00:00<00:19, 7655.88it/s]","\rparsing log, completed traces ::   1%|1         | 1606/150370 [00:00<00:18, 8091.67it/s]","\rparsing log, completed traces ::   2%|1         | 2416/150370 [00:00<00:44, 3323.05it/s]","\rparsing log, completed traces ::   2%|2         | 3230/150370 [00:00<00:33, 4340.17it/s]","\rparsing log, completed traces ::   3%|2         | 4058/150370 [00:00<00:27, 5253.03it/s]","\rparsing log, completed traces ::   3%|3         | 4885/150370 [00:00<00:24, 6003.26it/s]","\rparsing log, completed traces ::   4%|3         | 5698/150370 [00:01<00:22, 6560.17it/s]","\rparsing log, completed traces ::   4%|4         | 6518/150370 [00:01<00:20, 6997.61it/s]","\rparsing log, completed traces ::   5%|4         | 7328/150370 [00:01<00:19, 7305.26it/s]","\rparsing log, completed traces ::   5%|5         | 8188/150370 [00:01<00:18, 7651.98it/s]","\rparsing log, completed traces ::   6%|6         | 9071/150370 [00:01<00:17, 7990.79it/s]","\rparsing log, completed traces ::   7%|6         | 9915/150370 [00:01<00:17, 8119.30it/s]","\rparsing log, completed traces ::   7%|7         | 10751/150370 [00:01<00:17, 8165.91it/s]","\rparsing log, completed traces ::   8%|7         | 11603/150370 [00:01<00:16, 8249.28it/s]","\rparsing log, completed traces ::   8%|8         | 12440/150370 [00:01<00:16, 8219.02it/s]","\rparsing log, completed traces ::   9%|8         | 13273/150370 [00:01<00:16, 8246.79it/s]","\rparsing log, completed traces ::   9%|9         | 14104/150370 [00:02<00:16, 8192.28it/s]","\rparsing log, completed traces ::  10%|9         | 14946/150370 [00:02<00:16, 8257.11it/s]","\rparsing log, completed traces ::  10%|#         | 15775/150370 [00:02<00:34, 3877.98it/s]","\rparsing log, completed traces ::  11%|#1        | 16636/150370 [00:02<00:28, 4663.23it/s]","\rparsing log, completed traces ::  12%|#1        | 17497/150370 [00:02<00:24, 5418.77it/s]","\rparsing log, completed traces ::  12%|#2        | 18330/150370 [00:02<00:21, 6043.84it/s]","\rparsing log, completed traces ::  13%|#2        | 19196/150370 [00:03<00:19, 6657.22it/s]","\rparsing log, completed traces ::  13%|#3        | 20030/150370 [00:03<00:18, 7079.73it/s]","\rparsing log, completed traces ::  14%|#3        | 20887/150370 [00:03<00:17, 7454.93it/s]","\rparsing log, completed traces ::  15%|#4        | 21812/150370 [00:03<00:16, 7923.10it/s]","\rparsing log, completed traces ::  15%|#5        | 22725/150370 [00:03<00:15, 8259.70it/s]","\rparsing log, completed traces ::  16%|#5        | 23594/150370 [00:03<00:15, 8343.80it/s]","\rparsing log, completed traces ::  16%|#6        | 24459/150370 [00:03<00:16, 7844.37it/s]","\rparsing log, completed traces ::  17%|#6        | 25271/150370 [00:03<00:16, 7621.19it/s]","\rparsing log, completed traces ::  17%|#7        | 26053/150370 [00:03<00:16, 7424.54it/s]","\rparsing log, completed traces ::  18%|#7        | 26809/150370 [00:03<00:17, 7176.63it/s]","\rparsing log, completed traces ::  18%|#8        | 27537/150370 [00:04<00:17, 7026.91it/s]","\rparsing log, completed traces ::  19%|#8        | 28247/150370 [00:04<00:17, 7012.69it/s]","\rparsing log, completed traces ::  19%|#9        | 29051/150370 [00:04<00:16, 7301.23it/s]","\rparsing log, completed traces ::  20%|#9        | 29845/150370 [00:04<00:16, 7483.88it/s]","\rparsing log, completed traces ::  20%|##        | 30598/150370 [00:04<00:36, 3276.63it/s]","\rparsing log, completed traces ::  21%|##        | 31297/150370 [00:05<00:30, 3847.46it/s]","\rparsing log, completed traces ::  21%|##1       | 31992/150370 [00:05<00:26, 4406.06it/s]","\rparsing log, completed traces ::  22%|##1       | 32700/150370 [00:05<00:23, 4952.92it/s]","\rparsing log, completed traces ::  22%|##2       | 33415/150370 [00:05<00:21, 5443.55it/s]","\rparsing log, completed traces ::  23%|##2       | 34140/150370 [00:05<00:19, 5882.99it/s]","\rparsing log, completed traces ::  23%|##3       | 34837/150370 [00:05<00:18, 6162.92it/s]","\rparsing log, completed traces ::  24%|##3       | 35549/150370 [00:05<00:17, 6419.79it/s]","\rparsing log, completed traces ::  24%|##4       | 36256/150370 [00:05<00:17, 6583.40it/s]","\rparsing log, completed traces ::  25%|##4       | 36993/150370 [00:05<00:16, 6805.29it/s]","\rparsing log, completed traces ::  25%|##5       | 37721/150370 [00:05<00:16, 6942.09it/s]","\rparsing log, completed traces ::  26%|##5       | 38463/150370 [00:06<00:15, 7064.64it/s]","\rparsing log, completed traces ::  26%|##6       | 39225/150370 [00:06<00:15, 7227.42it/s]","\rparsing log, completed traces ::  27%|##6       | 39992/150370 [00:06<00:15, 7356.54it/s]","\rparsing log, completed traces ::  27%|##7       | 40749/150370 [00:06<00:14, 7418.12it/s]","\rparsing log, completed traces ::  28%|##7       | 41535/150370 [00:06<00:14, 7533.34it/s]","\rparsing log, completed traces ::  28%|##8       | 42335/150370 [00:06<00:14, 7670.38it/s]","\rparsing log, completed traces ::  29%|##8       | 43114/150370 [00:06<00:13, 7705.92it/s]","\rparsing log, completed traces ::  29%|##9       | 43887/150370 [00:06<00:13, 7701.43it/s]","\rparsing log, completed traces ::  30%|##9       | 44663/150370 [00:06<00:13, 7718.23it/s]","\rparsing log, completed traces ::  30%|###       | 45436/150370 [00:06<00:13, 7642.61it/s]","\rparsing log, completed traces ::  31%|###       | 46202/150370 [00:07<00:13, 7591.50it/s]","\rparsing log, completed traces ::  31%|###1      | 46962/150370 [00:07<00:33, 3048.85it/s]","\rparsing log, completed traces ::  32%|###1      | 47685/150370 [00:07<00:28, 3655.04it/s]","\rparsing log, completed traces ::  32%|###2      | 48490/150370 [00:07<00:23, 4408.81it/s]","\rparsing log, completed traces ::  33%|###2      | 49350/150370 [00:07<00:19, 5233.05it/s]","\rparsing log, completed traces ::  33%|###3      | 50130/150370 [00:08<00:17, 5796.42it/s]","\rparsing log, completed traces ::  34%|###3      | 50885/150370 [00:08<00:16, 6214.52it/s]","\rparsing log, completed traces ::  34%|###4      | 51661/150370 [00:08<00:14, 6606.06it/s]","\rparsing log, completed traces ::  35%|###4      | 52420/150370 [00:08<00:14, 6865.11it/s]","\rparsing log, completed traces ::  35%|###5      | 53186/150370 [00:08<00:13, 7082.87it/s]","\rparsing log, completed traces ::  36%|###5      | 53952/150370 [00:08<00:13, 7244.59it/s]","\rparsing log, completed traces ::  36%|###6      | 54781/150370 [00:08<00:12, 7544.67it/s]","\rparsing log, completed traces ::  37%|###6      | 55563/150370 [00:08<00:12, 7610.24it/s]","\rparsing log, completed traces ::  37%|###7      | 56377/150370 [00:08<00:12, 7764.56it/s]","\rparsing log, completed traces ::  38%|###8      | 57202/150370 [00:08<00:11, 7906.17it/s]","\rparsing log, completed traces ::  39%|###8      | 58003/150370 [00:09<00:11, 7901.03it/s]","\rparsing log, completed traces ::  39%|###9      | 58800/150370 [00:09<00:11, 7896.33it/s]","\rparsing log, completed traces ::  40%|###9      | 59613/150370 [00:09<00:11, 7940.78it/s]","\rparsing log, completed traces ::  40%|####      | 60415/150370 [00:09<00:11, 7945.67it/s]","\rparsing log, completed traces ::  41%|####      | 61298/150370 [00:09<00:10, 8207.80it/s]","\rparsing log, completed traces ::  41%|####1     | 62195/150370 [00:09<00:10, 8434.16it/s]","\rparsing log, completed traces ::  42%|####1     | 63040/150370 [00:09<00:10, 8360.68it/s]","\rparsing log, completed traces ::  42%|####2     | 63878/150370 [00:09<00:10, 8241.81it/s]","\rparsing log, completed traces ::  43%|####3     | 64705/150370 [00:09<00:10, 8235.76it/s]","\rparsing log, completed traces ::  44%|####3     | 65540/150370 [00:09<00:10, 8269.33it/s]","\rparsing log, completed traces ::  44%|####4     | 66388/150370 [00:10<00:10, 8331.45it/s]","\rparsing log, completed traces ::  45%|####4     | 67222/150370 [00:10<00:27, 3057.95it/s]","\rparsing log, completed traces ::  45%|####5     | 68114/150370 [00:10<00:21, 3849.56it/s]","\rparsing log, completed traces ::  46%|####5     | 68958/150370 [00:10<00:17, 4592.16it/s]","\rparsing log, completed traces ::  46%|####6     | 69770/150370 [00:11<00:15, 5253.92it/s]","\rparsing log, completed traces ::  47%|####6     | 70581/150370 [00:11<00:13, 5857.78it/s]","\rparsing log, completed traces ::  47%|####7     | 71397/150370 [00:11<00:12, 6390.77it/s]","\rparsing log, completed traces ::  48%|####8     | 72203/150370 [00:11<00:11, 6804.73it/s]","\rparsing log, completed traces ::  49%|####8     | 72998/150370 [00:11<00:10, 7071.26it/s]","\rparsing log, completed traces ::  49%|####9     | 73789/150370 [00:11<00:10, 7217.69it/s]","\rparsing log, completed traces ::  50%|####9     | 74703/150370 [00:11<00:09, 7750.39it/s]","\rparsing log, completed traces ::  50%|#####     | 75524/150370 [00:11<00:09, 7879.67it/s]","\rparsing log, completed traces ::  51%|#####     | 76383/150370 [00:11<00:09, 8083.33it/s]","\rparsing log, completed traces ::  51%|#####1    | 77216/150370 [00:11<00:09, 8110.04it/s]","\rparsing log, completed traces ::  52%|#####1    | 78044/150370 [00:12<00:08, 8041.26it/s]","\rparsing log, completed traces ::  52%|#####2    | 78860/150370 [00:12<00:08, 8009.50it/s]","\rparsing log, completed traces ::  53%|#####2    | 79670/150370 [00:12<00:08, 7987.03it/s]","\rparsing log, completed traces ::  54%|#####3    | 80477/150370 [00:12<00:08, 8008.01it/s]","\rparsing log, completed traces ::  54%|#####4    | 81282/150370 [00:12<00:08, 7999.62it/s]","\rparsing log, completed traces ::  55%|#####4    | 82121/150370 [00:12<00:08, 8115.21it/s]","\rparsing log, completed traces ::  55%|#####5    | 82980/150370 [00:12<00:08, 8255.84it/s]","\rparsing log, completed traces ::  56%|#####5    | 83808/150370 [00:12<00:08, 8246.60it/s]","\rparsing log, completed traces ::  56%|#####6    | 84634/150370 [00:12<00:08, 8171.45it/s]","\rparsing log, completed traces ::  57%|#####6    | 85453/150370 [00:12<00:07, 8141.07it/s]","\rparsing log, completed traces ::  57%|#####7    | 86275/150370 [00:13<00:07, 8163.09it/s]","\rparsing log, completed traces ::  58%|#####7    | 87099/150370 [00:13<00:07, 8184.51it/s]","\rparsing log, completed traces ::  58%|#####8    | 87927/150370 [00:13<00:07, 8212.85it/s]","\rparsing log, completed traces ::  59%|#####9    | 88756/150370 [00:13<00:07, 8235.54it/s]","\rparsing log, completed traces ::  60%|#####9    | 89580/150370 [00:13<00:07, 8182.03it/s]","\rparsing log, completed traces ::  60%|######    | 90420/150370 [00:13<00:07, 8246.47it/s]","\rparsing log, completed traces ::  61%|######    | 91245/150370 [00:14<00:21, 2788.52it/s]","\rparsing log, completed traces ::  61%|######1   | 92074/150370 [00:14<00:16, 3481.95it/s]","\rparsing log, completed traces ::  62%|######1   | 92898/150370 [00:14<00:13, 4203.23it/s]","\rparsing log, completed traces ::  62%|######2   | 93731/150370 [00:14<00:11, 4940.92it/s]","\rparsing log, completed traces ::  63%|######2   | 94589/150370 [00:14<00:09, 5673.57it/s]","\rparsing log, completed traces ::  63%|######3   | 95444/150370 [00:14<00:08, 6320.45it/s]","\rparsing log, completed traces ::  64%|######4   | 96274/150370 [00:14<00:07, 6800.36it/s]","\rparsing log, completed traces ::  65%|######4   | 97093/150370 [00:15<00:07, 7157.92it/s]","\rparsing log, completed traces ::  65%|######5   | 97909/150370 [00:15<00:07, 7426.92it/s]","\rparsing log, completed traces ::  66%|######5   | 98739/150370 [00:15<00:06, 7667.18it/s]","\rparsing log, completed traces ::  66%|######6   | 99558/150370 [00:15<00:06, 7795.22it/s]","\rparsing log, completed traces ::  67%|######6   | 100375/150370 [00:15<00:06, 7880.06it/s]","\rparsing log, completed traces ::  67%|######7   | 101201/150370 [00:15<00:06, 7990.36it/s]","\rparsing log, completed traces ::  68%|######7   | 102047/150370 [00:15<00:05, 8127.44it/s]","\rparsing log, completed traces ::  68%|######8   | 102874/150370 [00:15<00:05, 8132.85it/s]","\rparsing log, completed traces ::  69%|######8   | 103697/150370 [00:15<00:05, 8136.78it/s]","\rparsing log, completed traces ::  70%|######9   | 104518/150370 [00:15<00:05, 8095.24it/s]","\rparsing log, completed traces ::  70%|#######   | 105333/150370 [00:16<00:05, 8087.24it/s]","\rparsing log, completed traces ::  71%|#######   | 106145/150370 [00:16<00:05, 8027.34it/s]","\rparsing log, completed traces ::  71%|#######1  | 106951/150370 [00:16<00:05, 8028.40it/s]","\rparsing log, completed traces ::  72%|#######1  | 107756/150370 [00:16<00:05, 7996.44it/s]","\rparsing log, completed traces ::  72%|#######2  | 108557/150370 [00:16<00:05, 7964.82it/s]","\rparsing log, completed traces ::  73%|#######2  | 109355/150370 [00:16<00:05, 7968.72it/s]","\rparsing log, completed traces ::  73%|#######3  | 110154/150370 [00:16<00:05, 7974.28it/s]","\rparsing log, completed traces ::  74%|#######3  | 110952/150370 [00:16<00:04, 7962.98it/s]","\rparsing log, completed traces ::  74%|#######4  | 111761/150370 [00:16<00:04, 7976.12it/s]","\rparsing log, completed traces ::  75%|#######4  | 112559/150370 [00:16<00:04, 7908.56it/s]","\rparsing log, completed traces ::  75%|#######5  | 113351/150370 [00:17<00:04, 7844.06it/s]","\rparsing log, completed traces ::  76%|#######6  | 114314/150370 [00:17<00:04, 8372.78it/s]","\rparsing log, completed traces ::  77%|#######6  | 115307/150370 [00:17<00:03, 8835.64it/s]","\rparsing log, completed traces ::  77%|#######7  | 116271/150370 [00:17<00:03, 9055.94it/s]","\rparsing log, completed traces ::  78%|#######8  | 117377/150370 [00:17<00:03, 9651.85it/s]","\rparsing log, completed traces ::  79%|#######8  | 118344/150370 [00:17<00:03, 8896.44it/s]","\rparsing log, completed traces ::  79%|#######9  | 119246/150370 [00:18<00:11, 2829.20it/s]","\rparsing log, completed traces ::  80%|#######9  | 120000/150370 [00:18<00:09, 3362.44it/s]","\rparsing log, completed traces ::  80%|########  | 120739/150370 [00:18<00:07, 3922.48it/s]","\rparsing log, completed traces ::  81%|########  | 121491/150370 [00:18<00:06, 4518.73it/s]","\rparsing log, completed traces ::  81%|########1 | 122254/150370 [00:18<00:05, 5113.88it/s]","\rparsing log, completed traces ::  82%|########1 | 123002/150370 [00:18<00:04, 5611.72it/s]","\rparsing log, completed traces ::  82%|########2 | 123757/150370 [00:19<00:04, 6066.13it/s]","\rparsing log, completed traces ::  83%|########2 | 124498/150370 [00:19<00:04, 6363.64it/s]","\rparsing log, completed traces ::  83%|########3 | 125250/150370 [00:19<00:03, 6666.41it/s]","\rparsing log, completed traces ::  84%|########3 | 126015/150370 [00:19<00:03, 6929.45it/s]","\rparsing log, completed traces ::  84%|########4 | 126796/150370 [00:19<00:03, 7155.65it/s]","\rparsing log, completed traces ::  85%|########4 | 127565/150370 [00:19<00:03, 7293.52it/s]","\rparsing log, completed traces ::  85%|########5 | 128330/150370 [00:19<00:02, 7395.64it/s]","\rparsing log, completed traces ::  86%|########5 | 129117/150370 [00:19<00:02, 7533.15it/s]","\rparsing log, completed traces ::  86%|########6 | 129900/150370 [00:19<00:02, 7600.52it/s]","\rparsing log, completed traces ::  87%|########6 | 130679/150370 [00:19<00:02, 7644.00it/s]","\rparsing log, completed traces ::  87%|########7 | 131466/150370 [00:20<00:02, 7710.12it/s]","\rparsing log, completed traces ::  88%|########8 | 132387/150370 [00:20<00:02, 8142.52it/s]","\rparsing log, completed traces ::  89%|########8 | 133253/150370 [00:20<00:02, 8276.22it/s]","\rparsing log, completed traces ::  89%|########9 | 134084/150370 [00:20<00:01, 8214.69it/s]","\rparsing log, completed traces ::  90%|########9 | 134908/150370 [00:20<00:01, 8095.95it/s]","\rparsing log, completed traces ::  90%|######### | 135720/150370 [00:20<00:01, 8002.45it/s]","\rparsing log, completed traces ::  91%|######### | 136522/150370 [00:20<00:01, 7926.37it/s]","\rparsing log, completed traces ::  91%|#########1| 137316/150370 [00:20<00:01, 7800.27it/s]","\rparsing log, completed traces ::  92%|#########1| 138097/150370 [00:20<00:01, 7769.05it/s]","\rparsing log, completed traces ::  92%|#########2| 138875/150370 [00:20<00:01, 7765.75it/s]","\rparsing log, completed traces ::  93%|#########2| 139652/150370 [00:21<00:01, 7763.48it/s]","\rparsing log, completed traces ::  93%|#########3| 140460/150370 [00:21<00:01, 7833.57it/s]","\rparsing log, completed traces ::  94%|#########3| 141257/150370 [00:21<00:01, 7872.23it/s]","\rparsing log, completed traces ::  94%|#########4| 142059/150370 [00:21<00:01, 7911.11it/s]","\rparsing log, completed traces ::  95%|#########4| 142851/150370 [00:21<00:00, 7873.58it/s]","\rparsing log, completed traces ::  96%|#########5| 143639/150370 [00:21<00:00, 7867.71it/s]","\rparsing log, completed traces ::  96%|#########6| 144431/150370 [00:21<00:00, 7882.95it/s]","\rparsing log, completed traces ::  97%|#########6| 145220/150370 [00:21<00:00, 7638.33it/s]","\rparsing log, completed traces ::  97%|#########7| 145986/150370 [00:21<00:00, 7187.64it/s]","\rparsing log, completed traces ::  98%|#########7| 146711/150370 [00:22<00:00, 6916.43it/s]","\rparsing log, completed traces ::  98%|#########8| 147408/150370 [00:22<00:00, 6672.73it/s]","\rparsing log, completed traces ::  98%|#########8| 148080/150370 [00:23<00:01, 1981.38it/s]","\rparsing log, completed traces ::  99%|#########8| 148742/150370 [00:23<00:00, 2468.54it/s]","\rparsing log, completed traces ::  99%|#########9| 149436/150370 [00:23<00:00, 3051.73it/s]","\rparsing log, completed traces :: 100%|#########9| 150171/150370 [00:23<00:00, 3726.59it/s]","","\rparsing log, completed traces :: 100%|##########| 150370/150370 [00:23<00:00, 6421.20it/s]","\n","[data] Loaded datasets: ['BPI2012', 'BPI2017', 'ROAD']","\n","\n=== Dataset: BPI2012 ===","\n","Samples train/val/test: 22252/4176/4196; vocab=23","\n","Epoch 1: validation_loss = 0.5594 | val_acc=0.7409 | val_f1=0.5316 | val_top3=0.9840","\n","Epoch 2: validation_loss = 0.5308 | val_acc=0.7598 | val_f1=0.5425 | val_top3=0.9854","\n","Epoch 3: validation_loss = 0.5333 | val_acc=0.7574 | val_f1=0.5725 | val_top3=0.9859","\n","Epoch 4: validation_loss = 0.5195 | val_acc=0.7629 | val_f1=0.5835 | val_top3=0.9861","\n","Epoch 5: validation_loss = 0.5221 | val_acc=0.7450 | val_f1=0.6007 | val_top3=0.9854","\n","Epoch 6: validation_loss = 0.5249 | val_acc=0.7634 | val_f1=0.5833 | val_top3=0.9861","\n","Epoch 7: validation_loss = 0.5073 | val_acc=0.7639 | val_f1=0.5909 | val_top3=0.9856","\n","Epoch 8: validation_loss = 0.5113 | val_acc=0.7593 | val_f1=0.5790 | val_top3=0.9859","\n","Epoch 9: validation_loss = 0.5105 | val_acc=0.7639 | val_f1=0.5842 | val_top3=0.9852","\n","Epoch 10: validation_loss = 0.5201 | val_acc=0.7634 | val_f1=0.5797 | val_top3=0.9847","\n","[BPI2012] Train: loss=0.5148 acc=0.7777 f1=0.5609 top3=0.9868","\n","[BPI2012] Test:  loss=0.5355 acc=0.7569 f1=0.5872 top3=0.9874","\n","\n=== Dataset: BPI2017 ===","\n","Samples train/val/test: 34519/7403/7374; vocab=24","\n","Epoch 1: validation_loss = 0.4172 | val_acc=0.8368 | val_f1=0.5299 | val_top3=0.9904","\n","Epoch 2: validation_loss = 0.4004 | val_acc=0.8367 | val_f1=0.5595 | val_top3=0.9907","\n","Epoch 3: validation_loss = 0.3864 | val_acc=0.8384 | val_f1=0.5719 | val_top3=0.9912","\n","Epoch 4: validation_loss = 0.3847 | val_acc=0.8395 | val_f1=0.5903 | val_top3=0.9919","\n","Epoch 5: validation_loss = 0.3812 | val_acc=0.8405 | val_f1=0.5856 | val_top3=0.9922","\n","Epoch 6: validation_loss = 0.3802 | val_acc=0.8376 | val_f1=0.5896 | val_top3=0.9916","\n","Epoch 7: validation_loss = 0.3769 | val_acc=0.8361 | val_f1=0.5957 | val_top3=0.9924","\n","Epoch 8: validation_loss = 0.3799 | val_acc=0.8386 | val_f1=0.6180 | val_top3=0.9927","\n","Epoch 9: validation_loss = 0.3805 | val_acc=0.8391 | val_f1=0.5989 | val_top3=0.9926","\n","Epoch 10: validation_loss = 0.3756 | val_acc=0.8399 | val_f1=0.6155 | val_top3=0.9928","\n","[BPI2017] Train: loss=0.3607 acc=0.8422 f1=0.5721 top3=0.9941","\n","[BPI2017] Test:  loss=0.3877 acc=0.8332 f1=0.5710 top3=0.9906","\n","\n=== Dataset: ROAD ===","\n","Samples train/val/test: 8707/1928/1869; vocab=11","\n","Epoch 1: validation_loss = 0.4913 | val_acc=0.7993 | val_f1=0.3684 | val_top3=0.9922","\n","Epoch 2: validation_loss = 0.4561 | val_acc=0.8086 | val_f1=0.4514 | val_top3=0.9948","\n","Epoch 3: validation_loss = 0.4566 | val_acc=0.8091 | val_f1=0.5300 | val_top3=0.9969","\n","Epoch 4: validation_loss = 0.4482 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 5: validation_loss = 0.4355 | val_acc=0.8112 | val_f1=0.6427 | val_top3=0.9969","\n","Epoch 6: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 7: validation_loss = 0.4328 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 8: validation_loss = 0.4334 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 9: validation_loss = 0.4274 | val_acc=0.8117 | val_f1=0.6438 | val_top3=0.9969","\n","Epoch 10: validation_loss = 0.4329 | val_acc=0.8122 | val_f1=0.6664 | val_top3=0.9969","\n","[ROAD] Train: loss=0.4662 acc=0.7894 f1=0.5395 top3=0.9986","\n","[ROAD] Test:  loss=0.4833 acc=0.8020 f1=0.4740 top3=0.9936","\n","Execution time: 3 minutes seconds (time limit is an hour)."],"parse_metrics_plan":"I will load the numpy file from the specified working directory, parse the nested experiment_data structure, and compute final or best metrics as requested. For training and test, I will report the final metrics saved in the structure. For validation, I will compute the best values across epochs for accuracy, F1 score, and top-3 accuracy, and the minimum validation loss using the recorded loss history. The script prints the dataset name followed by clearly labeled metrics and executes immediately.","parse_metrics_code":"import os\nimport numpy as np\n\n\ndef safe_get(d, *keys, default=None):\n    cur = d\n    for k in keys:\n        if isinstance(cur, dict) and k in cur:\n            cur = cur[k]\n        else:\n            return default\n    return cur\n\n\ndef load_experiment_data():\n    working_dir = os.path.join(os.getcwd(), \"working\")\n    path = os.path.join(working_dir, \"experiment_data.npy\")\n    if not os.path.isfile(path):\n        raise FileNotFoundError(f\"File not found: {path}\")\n    data = np.load(path, allow_pickle=True).item()\n    if not isinstance(data, dict):\n        raise ValueError(\"Loaded experiment_data is not a dict.\")\n    return data\n\n\ndef extract_final_train_metrics(ds_data):\n    # Expect a 'final' entry\n    train_entries = safe_get(ds_data, \"metrics\", \"train\", default=[])\n    final = None\n    for tag, vals in train_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"train loss\"] = final.get(\"loss\", None)\n        out[\"train accuracy\"] = final.get(\"acc\", None)\n        out[\"train F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"train top-3 accuracy\"] = final.get(\"top3\", None)\n    else:\n        # Fallback: try last value from losses for loss only\n        train_losses = safe_get(ds_data, \"losses\", \"train\", default=[])\n        if train_losses:\n            out[\"train loss\"] = train_losses[-1][1]\n    return out\n\n\ndef extract_best_val_metrics(ds_data):\n    # Collect per-epoch validation metrics (acc, macro_f1, top3)\n    val_entries = safe_get(ds_data, \"metrics\", \"val\", default=[])\n    best = {\n        \"validation accuracy\": None,\n        \"validation F1 score\": None,\n        \"validation top-3 accuracy\": None,\n    }\n    for tag, vals in val_entries:\n        if isinstance(vals, dict):\n            acc = vals.get(\"acc\", None)\n            f1 = vals.get(\"macro_f1\", None)\n            top3 = vals.get(\"top3\", None)\n            if acc is not None:\n                best[\"validation accuracy\"] = (\n                    acc\n                    if best[\"validation accuracy\"] is None\n                    else max(best[\"validation accuracy\"], acc)\n                )\n            if f1 is not None:\n                best[\"validation F1 score\"] = (\n                    f1\n                    if best[\"validation F1 score\"] is None\n                    else max(best[\"validation F1 score\"], f1)\n                )\n            if top3 is not None:\n                best[\"validation top-3 accuracy\"] = (\n                    top3\n                    if best[\"validation top-3 accuracy\"] is None\n                    else max(best[\"validation top-3 accuracy\"], top3)\n                )\n    # For validation loss, use recorded losses per epoch and take the minimum\n    val_losses = safe_get(ds_data, \"losses\", \"val\", default=[])\n    if val_losses:\n        min_val_loss = min((v for (_, v) in val_losses), default=None)\n    else:\n        # fallback: check 'final' val entry if present\n        min_val_loss = None\n        for tag, vals in val_entries:\n            if tag == \"final\" and isinstance(vals, dict):\n                min_val_loss = vals.get(\"loss\", None)\n                break\n    out = {\"validation loss\": min_val_loss}\n    out.update(best)\n    return out\n\n\ndef extract_final_test_metrics(ds_data):\n    test_entries = safe_get(ds_data, \"metrics\", \"test\", default=[])\n    final = None\n    for tag, vals in test_entries:\n        if tag == \"final\":\n            final = vals\n    out = {}\n    if final:\n        out[\"test loss\"] = final.get(\"loss\", None)\n        out[\"test accuracy\"] = final.get(\"acc\", None)\n        out[\"test F1 score\"] = final.get(\"macro_f1\", None)\n        out[\"test top-3 accuracy\"] = final.get(\"top3\", None)\n    return out\n\n\ndef format_print_metrics(dataset_name, metrics_dict):\n    print(dataset_name)\n    # Keep a consistent order for readability\n    ordered_keys = [\n        \"train loss\",\n        \"train accuracy\",\n        \"train F1 score\",\n        \"train top-3 accuracy\",\n        \"validation loss\",\n        \"validation accuracy\",\n        \"validation F1 score\",\n        \"validation top-3 accuracy\",\n        \"test loss\",\n        \"test accuracy\",\n        \"test F1 score\",\n        \"test top-3 accuracy\",\n    ]\n    printed_any = False\n    for k in ordered_keys:\n        if k in metrics_dict and metrics_dict[k] is not None:\n            val = metrics_dict[k]\n            if isinstance(val, float):\n                print(f\"{k}: {val:.4f}\")\n            else:\n                print(f\"{k}: {val}\")\n            printed_any = True\n    # Print any remaining keys that were not in the ordered list\n    for k, v in metrics_dict.items():\n        if k not in ordered_keys and v is not None:\n            if isinstance(v, float):\n                print(f\"{k}: {v:.4f}\")\n            else:\n                print(f\"{k}: {v}\")\n            printed_any = True\n    if not printed_any:\n        print(\"No metrics available\")\n\n\ndef run():\n    experiment_data = load_experiment_data()\n    for ds_name, ds_data in experiment_data.items():\n        all_metrics = {}\n        all_metrics.update(extract_final_train_metrics(ds_data))\n        all_metrics.update(extract_best_val_metrics(ds_data))\n        all_metrics.update(extract_final_test_metrics(ds_data))\n        format_print_metrics(ds_name, all_metrics)\n\n\n# Execute immediately\nrun()\n","parse_term_out":["BPI2012","\n","train loss: 0.5148","\n","train accuracy: 0.7777","\n","train F1 score: 0.5609","\n","train top-3 accuracy: 0.9868","\n","validation loss: 0.5073","\n","validation accuracy: 0.7639","\n","validation F1 score: 0.6007","\n","validation top-3 accuracy: 0.9861","\n","test loss: 0.5355","\n","test accuracy: 0.7569","\n","test F1 score: 0.5872","\n","test top-3 accuracy: 0.9874","\n","BPI2017","\n","train loss: 0.3607","\n","train accuracy: 0.8422","\n","train F1 score: 0.5721","\n","train top-3 accuracy: 0.9941","\n","validation loss: 0.3756","\n","validation accuracy: 0.8405","\n","validation F1 score: 0.6180","\n","validation top-3 accuracy: 0.9928","\n","test loss: 0.3877","\n","test accuracy: 0.8332","\n","test F1 score: 0.5710","\n","test top-3 accuracy: 0.9906","\n","ROAD","\n","train loss: 0.4662","\n","train accuracy: 0.7894","\n","train F1 score: 0.5395","\n","train top-3 accuracy: 0.9986","\n","validation loss: 0.4274","\n","validation accuracy: 0.8122","\n","validation F1 score: 0.6664","\n","validation top-3 accuracy: 0.9969","\n","test loss: 0.4833","\n","test accuracy: 0.8020","\n","test F1 score: 0.4740","\n","test top-3 accuracy: 0.9936","\n","Execution time: a moment seconds (time limit is an hour)."],"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":237.50487351417542,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":"Primary issue: Feature normalization is applied twice and leaks information across splits. In build_prefix_dataset(), continuous features (deltas and since_start) are normalized using statistics computed over all samples (including validation/test). Later in train_one_dataset(), you attempt to \u201cre-normalize\u201d using train-only stats by applying a z-score again to the already-normalized values. This both introduces leakage (initial global stats influenced test/val) and yields incorrect scaling (z-scoring an already standardized variable). Fix: Remove any normalization from build_prefix_dataset and return raw feature values. After performing the time-based case split, compute mean/std on train samples only and then normalize train/val/test features from their raw values. Implementation options:\n- Easiest: Add a flag normalize=False in build_prefix_dataset (default False) and skip the initial normalization. In train_one_dataset, after splitting, compute dt_mean,dt_std,ss_mean,ss_std from train samples and apply to all splits.\n- Alternatively, have build_prefix_dataset return both raw and normalized features or just raw, and do all normalization post-split.\nSecondary improvements (not hard bugs but recommended):\n- Exclude the PAD class from evaluation/top-k by zeroing its logit or masking it before softmax/topk, and compute macro-F1 over actual activity classes only. Also set ignore_index=pad_idx in CrossEntropyLoss if ever labels could be PAD.\n- Minor: when lifecycle filter removes all events, your fallback keeps all events; consider explicitly handling lifecycle values rather than silently reverting.\nDespite the normalization issue, the run completes and reports per-log next-activity metrics (acc, macro-F1, top-3) with time-based splits on BPI2012, BPI2017, and ROAD as required.","exp_results_dir":null,"metric":{"value":{"metric_names":[{"metric_name":"loss","lower_is_better":true,"description":"Cross-entropy loss on the test split; lower values indicate better performance.","data":[{"dataset_name":"BPI2012","final_value":0.5355,"best_value":0.5355},{"dataset_name":"BPI2017","final_value":0.3877,"best_value":0.3877},{"dataset_name":"ROAD","final_value":0.4833,"best_value":0.4833}]},{"metric_name":"accuracy","lower_is_better":false,"description":"Classification accuracy on the test split; proportion of correct predictions.","data":[{"dataset_name":"BPI2012","final_value":0.7569,"best_value":0.7569},{"dataset_name":"BPI2017","final_value":0.8332,"best_value":0.8332},{"dataset_name":"ROAD","final_value":0.802,"best_value":0.802}]},{"metric_name":"F1 score","lower_is_better":false,"description":"F1 score on the test split; harmonic mean of precision and recall.","data":[{"dataset_name":"BPI2012","final_value":0.5872,"best_value":0.5872},{"dataset_name":"BPI2017","final_value":0.571,"best_value":0.571},{"dataset_name":"ROAD","final_value":0.474,"best_value":0.474}]},{"metric_name":"top-3 accuracy","lower_is_better":false,"description":"Top-3 accuracy on the test split; proportion where the correct label is among the top 3 predictions.","data":[{"dataset_name":"BPI2012","final_value":0.9874,"best_value":0.9874},{"dataset_name":"BPI2017","final_value":0.9906,"best_value":0.9906},{"dataset_name":"ROAD","final_value":0.9936,"best_value":0.9936}]}]},"maximize":null,"name":null,"description":null},"is_buggy":true,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":null,"is_seed_node":true,"is_seed_agg_node":false,"exec_time_feedback":""},{"code":"# plotting aggregation code","plan":"Aggregate results from multiple seeds","overall_plan":"","plot_code":"import matplotlib.pyplot as plt\nimport numpy as np\nimport os\n\nworking_dir = os.path.join(os.getcwd(), \"working\")\nos.makedirs(working_dir, exist_ok=True)\n\nfrom collections import defaultdict\nfrom sklearn.metrics import confusion_matrix\n\n\ndef safe_load_experiment(path_str):\n    try:\n        # Try environment-rooted path\n        root = os.getenv(\"AI_SCIENTIST_ROOT\")\n        if root is not None and len(root) > 0:\n            p = os.path.join(root, path_str)\n            if os.path.isfile(p):\n                return np.load(p, allow_pickle=True).item()\n        # Fallback: treat as relative/absolute path\n        if os.path.isfile(path_str):\n            return np.load(path_str, allow_pickle=True).item()\n        # Also try under working dir if provided as None/experiment_data.npy pattern\n        p2 = os.path.join(working_dir, os.path.basename(path_str))\n        if os.path.isfile(p2):\n            return np.load(p2, allow_pickle=True).item()\n    except Exception as e:\n        print(f\"Error loading experiment data from {path_str}: {e}\")\n    return None\n\n\ndef sem(a, axis=0):\n    a = np.array(a, dtype=float)\n    if a.size == 0:\n        return np.array([])\n    # count non-nan along axis\n    n = np.sum(~np.isnan(a), axis=axis)\n    std = np.nanstd(a, axis=axis, ddof=1)\n    with np.errstate(invalid=\"ignore\", divide=\"ignore\"):\n        se = std / np.sqrt(np.maximum(n, 1))\n    return se\n\n\ndef downsample_xs(xs, max_points=5):\n    xs_sorted = np.array(sorted(xs))\n    if len(xs_sorted) <= max_points:\n        return xs_sorted.tolist()\n    # pick approx quantile positions\n    qs = np.linspace(0, 1, num=max_points)\n    idx = np.unique(\n        np.clip((qs * (len(xs_sorted) - 1)).round().astype(int), 0, len(xs_sorted) - 1)\n    )\n    return xs_sorted[idx].tolist()\n\n\ndef main():\n    # Collect all experiment data dicts\n    try:\n        experiment_data_path_list = [\n            \"None/experiment_data.npy\",\n            \"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/experiment_57ccd5de0de34674be3985e9f94220ad_proc_361839/experiment_data.npy\",\n            \"None/experiment_data.npy\",\n        ]\n        all_experiment_data = []\n        for experiment_data_path in experiment_data_path_list:\n            data = safe_load_experiment(experiment_data_path)\n            if data is not None and isinstance(data, dict) and len(data) > 0:\n                all_experiment_data.append(data)\n            else:\n                print(\n                    f\"Skipped loading from {experiment_data_path} (missing or empty).\"\n                )\n        if len(all_experiment_data) == 0:\n            print(\"No experiment_data loaded; nothing to plot.\")\n            return\n    except Exception as e:\n        print(f\"Error loading experiment data: {e}\")\n        all_experiment_data = []\n        return\n\n    # Build dataset -> list of run dicts\n    datasets_runs = defaultdict(list)\n    for run_idx, exp_dict in enumerate(all_experiment_data):\n        for ds_name, ds_payload in exp_dict.items():\n            datasets_runs[ds_name].append(ds_payload)\n\n    # Aggregate and plot per dataset\n    for ds_name, runs in datasets_runs.items():\n        # Aggregate losses (train/val) by aligning epochs to min length\n        try:\n            # Collect lists of loss sequences\n            train_losses = []\n            val_losses = []\n            for r in runs:\n                tr = r.get(\"losses\", {}).get(\"train\", [])\n                vl = r.get(\"losses\", {}).get(\"val\", [])\n                # entries are list of (epoch, value) or just values; normalize to values\n                tr_vals = (\n                    [y for (_, y) in tr]\n                    if len(tr) > 0 and isinstance(tr[0], (list, tuple))\n                    else list(tr)\n                )\n                vl_vals = (\n                    [y for (_, y) in vl]\n                    if len(vl) > 0 and isinstance(vl[0], (list, tuple))\n                    else list(vl)\n                )\n                if len(tr_vals) > 0:\n                    train_losses.append(np.array(tr_vals, dtype=float))\n                if len(vl_vals) > 0:\n                    val_losses.append(np.array(vl_vals, dtype=float))\n            # Plot if we have at least one train or val\n            if len(train_losses) > 0 or len(val_losses) > 0:\n                plt.figure()\n                subtitle = \"Aggregated across runs | Next-activity\"\n                if len(train_losses) > 0:\n                    L = min([len(a) for a in train_losses])\n                    TL = np.stack([a[:L] for a in train_losses], axis=0)\n                    mean_tr = np.nanmean(TL, axis=0)\n                    sem_tr = sem(TL, axis=0)\n                    xs = np.arange(1, L + 1)\n                    plt.plot(xs, mean_tr, label=\"Train (Mean)\", color=\"tab:blue\")\n                    plt.fill_between(\n                        xs,\n                        mean_tr - sem_tr,\n                        mean_tr + sem_tr,\n                        color=\"tab:blue\",\n                        alpha=0.2,\n                        label=\"Train (SEM)\",\n                    )\n                if len(val_losses) > 0:\n                    L = min([len(a) for a in val_losses])\n                    VL = np.stack([a[:L] for a in val_losses], axis=0)\n                    mean_va = np.nanmean(VL, axis=0)\n                    sem_va = sem(VL, axis=0)\n                    xs = np.arange(1, L + 1)\n                    plt.plot(xs, mean_va, label=\"Val (Mean)\", color=\"tab:orange\")\n                    plt.fill_between(\n                        xs,\n                        mean_va - sem_va,\n                        mean_va + sem_va,\n                        color=\"tab:orange\",\n                        alpha=0.2,\n                        label=\"Val (SEM)\",\n                    )\n                plt.legend()\n                plt.xlabel(\"Epoch\")\n                plt.ylabel(\"Loss\")\n                plt.title(f\"{ds_name} - Loss Curves\\n{subtitle}\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{ds_name}_aggregated_loss_curves.png\")\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating aggregated loss curves for {ds_name}: {e}\")\n            plt.close()\n\n        # Aggregate test metrics across runs and bar plot with error bars\n        try:\n            metrics_list = []\n            for r in runs:\n                test_entries = r.get(\"metrics\", {}).get(\"test\", [])\n                if isinstance(test_entries, list) and len(test_entries) > 0:\n                    # take first entry's dict\n                    m = (\n                        dict(test_entries[0][1])\n                        if isinstance(test_entries[0], (list, tuple))\n                        else dict(test_entries[0])\n                    )\n                    # Only keep numeric keys\n                    usable = {\n                        k: float(v)\n                        for k, v in m.items()\n                        if isinstance(v, (int, float, np.floating))\n                    }\n                    if len(usable) > 0:\n                        metrics_list.append(usable)\n            if len(metrics_list) > 0:\n                keys = [\"acc\", \"macro_f1\", \"top3\", \"loss\"]\n                vals = []\n                for k in keys:\n                    arr = [d.get(k, np.nan) for d in metrics_list]\n                    vals.append(arr)\n                means = [np.nanmean(a) for a in vals]\n                errors = [sem(a) for a in vals]\n                xs = np.arange(len(keys))\n                plt.figure()\n                plt.bar(\n                    xs,\n                    means,\n                    yerr=errors,\n                    capsize=4,\n                    color=[\"tab:green\", \"tab:purple\", \"tab:red\", \"tab:gray\"],\n                    alpha=0.8,\n                    label=\"Mean \u00b1 SEM\",\n                )\n                plt.xticks(xs, keys)\n                plt.ylabel(\"Value\")\n                plt.title(\n                    f\"{ds_name} - Aggregated Test Metrics\\nAggregated across runs | Next-activity\"\n                )\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(working_dir, f\"{ds_name}_aggregated_test_metrics.png\")\n                )\n                plt.close()\n                # Print metrics\n                print(\n                    f\"{ds_name} | Test metrics (mean \u00b1 SEM): \"\n                    + \", \".join(\n                        [f\"{k}={m:.4f}\u00b1{e:.4f}\" for k, m, e in zip(keys, means, errors)]\n                    )\n                )\n        except Exception as e:\n            print(f\"Error creating aggregated test metrics for {ds_name}: {e}\")\n            plt.close()\n\n        # Aggregate Top-3 vs Prefix Length across runs (mean \u00b1 SEM), downsample xs to at most 5\n        try:\n            per_run_maps = []\n            all_L = set()\n            for r in runs:\n                pref = r.get(\"prefix_lens\", [])\n                flags = r.get(\"top3_flags\", [])\n                if len(pref) > 0 and len(flags) > 0:\n                    d = defaultdict(list)\n                    for L, f in zip(pref, flags):\n                        d[int(L)].append(int(f))\n                    # per-run mean per L\n                    run_map = {L: float(np.mean(v)) for L, v in d.items() if len(v) > 0}\n                    if len(run_map) > 0:\n                        per_run_maps.append(run_map)\n                        all_L.update(run_map.keys())\n            if len(per_run_maps) > 0:\n                xs_all = sorted(list(all_L))\n                xs_plot = downsample_xs(xs_all, max_points=5)\n                # Build matrix R x X with NaNs for missing\n                R = len(per_run_maps)\n                X = len(xs_plot)\n                M = np.full((R, X), np.nan, dtype=float)\n                for i, run_map in enumerate(per_run_maps):\n                    for j, L in enumerate(xs_plot):\n                        if L in run_map:\n                            M[i, j] = run_map[L]\n                mean_y = np.nanmean(M, axis=0)\n                err_y = sem(M, axis=0)\n                plt.figure()\n                plt.errorbar(\n                    xs_plot, mean_y, yerr=err_y, fmt=\"-o\", capsize=3, label=\"Mean \u00b1 SEM\"\n                )\n                plt.ylim(0.0, 1.0)\n                plt.xlabel(\"Prefix Length\")\n                plt.ylabel(\"Top-3 Accuracy\")\n                plt.title(\n                    f\"{ds_name} - Top-3 Accuracy vs Prefix Length\\nAggregated across runs | Next-activity\"\n                )\n                plt.legend()\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(\n                        working_dir, f\"{ds_name}_aggregated_top3_vs_prefixlen.png\"\n                    )\n                )\n                plt.close()\n        except Exception as e:\n            print(\n                f\"Error creating aggregated Top-3 vs Prefix Length for {ds_name}: {e}\"\n            )\n            plt.close()\n\n        # Aggregated confusion matrix (sum over runs)\n        try:\n            cm_sum = None\n            for r in runs:\n                y_true = r.get(\"ground_truth\", [])\n                y_pred = r.get(\"predictions\", [])\n                if len(y_true) > 0 and len(y_pred) > 0:\n                    # compute confusion for the labels present in this run\n                    labels = sorted(set(y_true) | set(y_pred))\n                    cm = confusion_matrix(y_true, y_pred, labels=labels)\n                    if cm_sum is None:\n                        cm_sum = cm\n                        cm_labels = labels\n                    else:\n                        # align labels\n                        all_labels = sorted(set(cm_labels) | set(labels))\n                        # expand cm_sum\n                        new_sum = np.zeros(\n                            (len(all_labels), len(all_labels)), dtype=int\n                        )\n                        # map old indices\n                        idx_old = {lab: i for i, lab in enumerate(cm_labels)}\n                        idx_new = {lab: i for i, lab in enumerate(all_labels)}\n                        for lab_i in cm_labels:\n                            for lab_j in cm_labels:\n                                new_sum[idx_new[lab_i], idx_new[lab_j]] += cm_sum[\n                                    idx_old[lab_i], idx_old[lab_j]\n                                ]\n                        # add current cm\n                        idx_cur = {lab: i for i, lab in enumerate(labels)}\n                        for lab_i in labels:\n                            for lab_j in labels:\n                                new_sum[idx_new[lab_i], idx_new[lab_j]] += cm[\n                                    idx_cur[lab_i], idx_cur[lab_j]\n                                ]\n                        cm_sum = new_sum\n                        cm_labels = all_labels\n            if cm_sum is not None:\n                plt.figure(figsize=(6, 5))\n                plt.imshow(cm_sum, aspect=\"auto\", cmap=\"Blues\")\n                plt.colorbar()\n                plt.title(\n                    f\"{ds_name} - Aggregated Confusion Matrix (Test)\\nAggregated across runs | Next-activity\"\n                )\n                plt.xlabel(\"Predicted\")\n                plt.ylabel(\"True\")\n                plt.tight_layout()\n                plt.savefig(\n                    os.path.join(\n                        working_dir, f\"{ds_name}_aggregated_confusion_matrix.png\"\n                    )\n                )\n                plt.close()\n        except Exception as e:\n            print(f\"Error creating aggregated confusion matrix for {ds_name}: {e}\")\n            plt.close()\n\n\nif __name__ == \"__main__\":\n    main()\n","plot_plan":null,"step":13,"id":"29473c6cb5124b67b0cb64d51dcc73c2","ctime":1757762831.244125,"_term_out":null,"parse_metrics_plan":"","parse_metrics_code":"","parse_term_out":null,"parse_exc_type":null,"parse_exc_info":null,"parse_exc_stack":null,"exec_time":null,"exc_type":null,"exc_info":null,"exc_stack":null,"analysis":null,"exp_results_dir":"experiments/2025-09-13_11-32-42_resource_centric_ppm_agents_attempt_0/logs/0-run/experiment_results/seed_aggregation_29473c6cb5124b67b0cb64d51dcc73c2","metric":{"value":null,"maximize":null,"name":null,"description":null},"is_buggy":false,"is_buggy_plots":null,"parent_id":null,"children":[],"plot_data":{},"plots_generated":false,"plots":[],"plot_paths":[],"plot_analyses":[],"vlm_feedback_summary":[],"datasets_successfully_tested":[],"ablation_name":null,"hyperparam_name":null,"is_seed_node":true,"is_seed_agg_node":true,"exec_time_feedback":""}],"node2parent":{"95afc8fd95764ce68e602a1cb05b0950":"726b2721d45c4800b9381c5d265fefcb","adda9b403f3744f1aa79ef815a1e80c9":"726b2721d45c4800b9381c5d265fefcb","8809469610964dfb89ac1f461173f888":"726b2721d45c4800b9381c5d265fefcb","28ff0ab9ab904c7b8042dbf7d450c79f":"726b2721d45c4800b9381c5d265fefcb","251df5cdee2b452db709366215875b0a":"95afc8fd95764ce68e602a1cb05b0950","4b69709685c641ddb0c83c8ee9b5d661":"726b2721d45c4800b9381c5d265fefcb","b6970d0586c74652a8d858ed9350bd81":"8809469610964dfb89ac1f461173f888","a1bad1cf5aec4ddfbb370ed8a179b41b":"726b2721d45c4800b9381c5d265fefcb","658ae461b48144a5bce939113f629297":"726b2721d45c4800b9381c5d265fefcb","26f8c955090b4c65877fc01f0de569ba":"726b2721d45c4800b9381c5d265fefcb","57ccd5de0de34674be3985e9f94220ad":"726b2721d45c4800b9381c5d265fefcb","852328dac5e14beb9bfce93a32da5a6a":"726b2721d45c4800b9381c5d265fefcb","29473c6cb5124b67b0cb64d51dcc73c2":"726b2721d45c4800b9381c5d265fefcb"},"__version":"2"}