{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "38091062-745e-473a-b6a5-18da737dbcfb",
   "metadata": {},
   "outputs": [],
   "source": [
    "!pip install openai\n",
    "!pip install networkx\n",
    "!pip install pydantic\n",
    "!pip install sentence_transformers\n",
    "!pip install scikit-learn\n",
    "!pip install POT\n",
    "!pip install huggingface_hub\n",
    "!pip install datasets\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c3d79808-94f4-4d24-a205-8aa62ae4635c",
   "metadata": {},
   "outputs": [],
   "source": [
    "!python -m spacy download en_core_web_sm\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e61d0bc0-1f7e-4c26-8d3e-00528141d134",
   "metadata": {},
   "outputs": [],
   "source": [
    "#Download ollama\n",
    "!curl -fsSL https://ollama.com/install.sh | sh\n",
    "import subprocess\n",
    "process = subprocess.Popen(\"ollama serve\", shell=True) #runs on a different thread"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "08102532-ab99-46cc-9fd4-c1803e0329be",
   "metadata": {},
   "outputs": [],
   "source": [
    "%%capture --no-display\n",
    "\n",
    "!ollama pull llama3 "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eea8ed37-932c-4e12-a272-582b0182278d",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Text processing\n",
    "def structure_text(text, nlp, max_chunk_size=500000):\n",
    "    \"\"\"\n",
    "    Structure a text into a NetworkX graph with handling of very long texts.\n",
    "    \n",
    "    Args:\n",
    "        text: The text to structure\n",
    "        nlp: The spaCy model\n",
    "        max_chunk_size: Maximum chunk size to avoid memory errors\n",
    "    \"\"\"\n",
    "    graph = nx.DiGraph()\n",
    "    doc_id = \"document\"\n",
    "    graph.add_node(doc_id, type=\"document\", text=\"Document\")\n",
    "\n",
    "    # For very long texts, we first divide into smaller chunks\n",
    "    if len(text) > max_chunk_size:\n",
    "        # Divide text into maximum-sized chunks trying to cut at paragraphs\n",
    "        chunks = []\n",
    "        current_chunk = \"\"\n",
    "        \n",
    "        sections = text.split(\"\\n\\n\")\n",
    "        for section in sections:\n",
    "            if len(current_chunk) + len(section) + 2 <= max_chunk_size:\n",
    "                current_chunk += section + \"\\n\\n\" if current_chunk else section\n",
    "            else:\n",
    "                if current_chunk:\n",
    "                    chunks.append(current_chunk.strip())\n",
    "                current_chunk = section\n",
    "        \n",
    "        if current_chunk:\n",
    "            chunks.append(current_chunk.strip())\n",
    "            \n",
    "        # Process each chunk separately\n",
    "        for chunk_idx, chunk in enumerate(chunks):\n",
    "            chunk_sections = chunk.split(\"\\n\\n\")\n",
    "            section_count = chunk_idx * 1000  # Offset to avoid ID collisions\n",
    "            \n",
    "            for sec in chunk_sections:\n",
    "                sec = sec.strip()\n",
    "                if not sec:\n",
    "                    continue\n",
    "\n",
    "                section_id = f\"section_{section_count}\"\n",
    "                graph.add_node(section_id, type=\"section\", text=sec[:200] + \"...\" if len(sec) > 200 else sec)\n",
    "                graph.add_edge(doc_id, section_id)\n",
    "\n",
    "                paragraphs = sec.split(\"\\n\")\n",
    "                for p_idx, paragraph in enumerate(paragraphs):\n",
    "                    paragraph = paragraph.strip()\n",
    "                    if not paragraph:\n",
    "                        continue\n",
    "\n",
    "                    para_id = f\"{section_id}_para_{p_idx}\"\n",
    "                    graph.add_node(para_id, type=\"paragraph\", text=paragraph)\n",
    "                    graph.add_edge(section_id, para_id)\n",
    "\n",
    "                section_count += 1\n",
    "    else:\n",
    "        # Normal processing for shorter texts\n",
    "        sections = text.split(\"\\n\\n\")\n",
    "        section_count = 0\n",
    "\n",
    "        for sec in sections:\n",
    "            sec = sec.strip()\n",
    "            if not sec:\n",
    "                continue\n",
    "\n",
    "            section_id = f\"section_{section_count}\"\n",
    "            graph.add_node(section_id, type=\"section\", text=sec.split(\"\\n\\n\")[0])\n",
    "            graph.add_edge(doc_id, section_id)\n",
    "\n",
    "            paragraphs = sec.split(\"\\n\")\n",
    "            for p_idx, paragraph in enumerate(paragraphs):\n",
    "                paragraph = paragraph.strip()\n",
    "                if not paragraph:\n",
    "                    continue\n",
    "\n",
    "                para_id = f\"{section_id}_para_{p_idx}\"\n",
    "                graph.add_node(para_id, type=\"paragraph\", text=paragraph)\n",
    "                graph.add_edge(section_id, para_id)\n",
    "\n",
    "                # Note: We avoid spaCy processing here as it can cause memory errors\n",
    "                # with very long texts. The graph is built only on structure.\n",
    "\n",
    "            section_count += 1\n",
    "\n",
    "    return graph"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "2059580f-48b8-440b-a0de-b15cc02cb863",
   "metadata": {},
   "outputs": [],
   "source": [
    "from openai import OpenAI\n",
    "import spacy\n",
    "import networkx as nx\n",
    "import matplotlib.pyplot as plt\n",
    "import json\n",
    "import pandas as pd\n",
    "# Exemple d'affichage du graphe d'une question :\n",
    "import matplotlib.pyplot as plt\n",
    "import os \n",
    "import json\n",
    "from sentence_transformers import SentenceTransformer\n",
    "import time\n",
    "\n",
    "nlp = spacy.load(\"en_core_web_sm\")\n",
    "model= SentenceTransformer(\"all-MiniLM-L6-v2\")\n",
    "client = OpenAI(base_url=\"http://localhost:11434/v1\", api_key=\"ollama\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8f49225f-1391-480a-9a0d-a2783da521e6",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "import json\n",
    "\n",
    "def generate_graphs_from_longbench_df(df, start_index=0, max_items=None, output_dir=\"/workspace/longbench-data\", save_every=10):\n",
    "    \"\"\"\n",
    "    Generate NetworkX graphs from a LongBench-v2 DataFrame.\n",
    "    Save results periodically to files.\n",
    "    \n",
    "    df : DataFrame with columns '_id', 'question', 'context', 'choice_A', 'choice_B', 'choice_C', 'choice_D', 'answer'\n",
    "    start_index : DataFrame row to start from\n",
    "    max_items : maximum number of items to process (None = all)\n",
    "    output_dir : output directory for files\n",
    "    save_every : save every N processed items\n",
    "    \"\"\"\n",
    "    import os\n",
    "    \n",
    "    # Create output directory if it doesn't exist\n",
    "    os.makedirs(output_dir, exist_ok=True)\n",
    "    \n",
    "    graphs_by_id = {}\n",
    "    questions_by_id = {}\n",
    "    choices_by_id = {}\n",
    "    answers_by_id = {}\n",
    "\n",
    "    end_index = len(df) if max_items is None else min(start_index + max_items, len(df))\n",
    "    \n",
    "    # Output files\n",
    "    graphs_file = os.path.join(output_dir, \"longbench_graphs.pkl\")\n",
    "    questions_file = os.path.join(output_dir, \"longbench_questions.json\")\n",
    "    choices_file = os.path.join(output_dir, \"longbench_choices.json\")\n",
    "    answers_file = os.path.join(output_dir, \"longbench_answers.json\")\n",
    "    \n",
    "    # Load existing data if it exists\n",
    "    if os.path.exists(graphs_file):\n",
    "        print(\"Loading existing graphs...\")\n",
    "        try:\n",
    "            with open(graphs_file, 'rb') as f:\n",
    "                graphs_by_id = pickle.load(f)\n",
    "        except:\n",
    "            print(\"Error loading graphs, restarting...\")\n",
    "            graphs_by_id = {}\n",
    "    \n",
    "    if os.path.exists(questions_file):\n",
    "        try:\n",
    "            with open(questions_file, 'r') as f:\n",
    "                questions_by_id = json.load(f)\n",
    "            with open(choices_file, 'r') as f:\n",
    "                choices_by_id = json.load(f)\n",
    "            with open(answers_file, 'r') as f:\n",
    "                answers_by_id = json.load(f)\n",
    "        except:\n",
    "            print(\"Error loading metadata, restarting...\")\n",
    "            questions_by_id = {}\n",
    "            choices_by_id = {}\n",
    "            answers_by_id = {}\n",
    "\n",
    "    processed_count = 0\n",
    "    for i in range(start_index, end_index):\n",
    "        row = df.iloc[i]\n",
    "        qid = row[\"_id\"]\n",
    "        \n",
    "        # Check if already processed\n",
    "        if qid in graphs_by_id:\n",
    "            print(f\"Skipping already processed index {i}, question ID: {qid}\")\n",
    "            continue\n",
    "        \n",
    "        print(f\"Processing index {i}/{end_index-1}, question ID: {qid}\")\n",
    "        \n",
    "        try:\n",
    "            # Extract data\n",
    "            question = row[\"question\"]\n",
    "            context = row[\"context\"]\n",
    "            \n",
    "            # Create graph from context\n",
    "            G = structure_text(context, nlp)\n",
    "            \n",
    "            # Store data\n",
    "            graphs_by_id[qid] = G\n",
    "            questions_by_id[qid] = question\n",
    "            choices_by_id[qid] = {\n",
    "                \"A\": row.get(\"choice_A\", \"\"),\n",
    "                \"B\": row.get(\"choice_B\", \"\"),  \n",
    "                \"C\": row.get(\"choice_C\", \"\"),\n",
    "                \"D\": row.get(\"choice_D\", \"\")\n",
    "            }\n",
    "            answers_by_id[qid] = row[\"answer\"]\n",
    "            \n",
    "            processed_count += 1\n",
    "            \n",
    "            # Periodic save\n",
    "            if processed_count % save_every == 0:\n",
    "                print(f\"Saving after {processed_count} items...\")\n",
    "                \n",
    "                with open(graphs_file, 'wb') as f:\n",
    "                    pickle.dump(graphs_by_id, f)\n",
    "                with open(questions_file, 'w') as f:\n",
    "                    json.dump(questions_by_id, f, indent=2)\n",
    "                with open(choices_file, 'w') as f:\n",
    "                    json.dump(choices_by_id, f, indent=2)\n",
    "                with open(answers_file, 'w') as f:\n",
    "                    json.dump(answers_by_id, f, indent=2)\n",
    "                \n",
    "                print(f\"Saved {len(graphs_by_id)} graphs to files\")\n",
    "        \n",
    "        except Exception as e:\n",
    "            print(f\"Error processing question {qid}: {e}\")\n",
    "            continue\n",
    "    \n",
    "    # Final save\n",
    "    print(\"Final save...\")\n",
    "    with open(graphs_file, 'wb') as f:\n",
    "        pickle.dump(graphs_by_id, f)\n",
    "    with open(questions_file, 'w') as f:\n",
    "        json.dump(questions_by_id, f, indent=2)\n",
    "    with open(choices_file, 'w') as f:\n",
    "        json.dump(choices_by_id, f, indent=2)\n",
    "    with open(answers_file, 'w') as f:\n",
    "        json.dump(answers_by_id, f, indent=2)\n",
    "    \n",
    "    print(f\"Generation complete. Processed {processed_count} new items.\")\n",
    "    print(f\"Total graphs: {len(graphs_by_id)}\")\n",
    "    \n",
    "    return graphs_by_id, questions_by_id, choices_by_id, answers_by_id"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "23f39ddf-d3b9-4d80-903a-30edc7b8d094",
   "metadata": {},
   "outputs": [],
   "source": [
    "from pydantic import BaseModel, ConfigDict\n",
    "from typing import List,Dict,Optional,Tuple\n",
    "import numpy as np\n",
    "class EmbeddingStore(BaseModel):\n",
    "    vectors: Dict[str, np.ndarray]\n",
    "    model_config = ConfigDict(arbitrary_types_allowed=True)\n",
    "\n",
    "\n",
    "class TraversalStep(BaseModel):\n",
    "    node_id: str\n",
    "    similarity: Optional[float]  # None pour la racine\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "16ff3b37-c871-4e0e-a1c2-25251f1cefcb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "T sum: 0.9999999999999991 FGW: 0.3253742472605895\n"
     ]
    }
   ],
   "source": [
    "# -*- coding: utf-8 -*-\n",
    "r\"\"\"\n",
    "FGW (Fused Gromov-Wasserstein) in PyTorch with **stabilized Sinkhorn** (log-domain)\n",
    "-------------------------------------------------------------------------------\n",
    "\n",
    "This module provides a *fully PyTorch / GPU-ready* implementation of FGW\n",
    "that replaces EMD (LP) subproblems with **stabilized Sinkhorn**.\n",
    "\n",
    "Objective (POT convention):\n",
    "    FGW(T) = (1 - alpha) * <M, T> + alpha * GW(T)\n",
    "\n",
    "- Direction subproblem (Frank–Wolfe):\n",
    "    min_T  <(1 - alpha) * M + alpha * grad_GW(G), T>  +  eps * KL(T || a \\otimes b)\n",
    "  solved by log-domain Sinkhorn (stabilized), constraint T\\mathbf{1}=a, T^T\\mathbf{1}=b.\n",
    "\n",
    "- Line search: closed-form quadratic POT-style on the GW part (non-entropic),\n",
    "  which works very well in practice.\n",
    "\n",
    "Notes\n",
    "- p, q are normalized internally (sum = 1) for stability.\n",
    "- float64 computation recommended (like POT); everything follows M's device.\n",
    "- No external dependencies (KeOps optional but not required).\n",
    "- Polished allows making a call to an exact emd solver in the last iteration\n",
    "\n",
    "Main API\n",
    "- fused_gromov_wasserstein_sinkhorn(...)\n",
    "- fused_gromov_wasserstein2_sinkhorn(...)\n",
    "\n",
    "\"\"\"\n",
    "from __future__ import annotations\n",
    "import math\n",
    "from typing import Callable, Optional, Tuple, Dict, Union\n",
    "import ot\n",
    "import torch\n",
    "import time\n",
    "# ---------------------------------------------------------------------------\n",
    "# FGW Utils: init_matrix, tensor_product, gw_loss, gw_grad (POT convention)\n",
    "# ---------------------------------------------------------------------------\n",
    "\n",
    "def _transform_matrix(C1: torch.Tensor, C2: torch.Tensor, loss_fun: str = 'square_loss') -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor]:\n",
    "    if loss_fun != 'square_loss':\n",
    "        raise ValueError(f\"Unsupported loss_fun={loss_fun} (only 'square_loss')\")\n",
    "    fC1 = C1 ** 2\n",
    "    fC2 = C2 ** 2\n",
    "    hC1 = C1\n",
    "    hC2 = 2.0 * C2\n",
    "    return fC1, fC2, hC1, hC2\n",
    "\n",
    "\n",
    "def init_matrix(C1: torch.Tensor, C2: torch.Tensor, p: torch.Tensor, q: torch.Tensor, loss_fun: str = 'square_loss') -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:\n",
    "    fC1, fC2, hC1, hC2 = _transform_matrix(C1, C2, loss_fun)\n",
    "    # constC = (fC1 @ p)[:,None] + [ (fC2 @ q)^T ][None,:]\n",
    "    constC1 = (fC1 @ p).unsqueeze(1)                   # (ns,1)\n",
    "    constC2 = (fC2 @ q).unsqueeze(0)                   # (1,nt)\n",
    "    constC = constC1 + constC2                         # (ns,nt)\n",
    "    return constC, hC1, hC2\n",
    "\n",
    "\n",
    "def tensor_product(constC: torch.Tensor, hC1: torch.Tensor, hC2: torch.Tensor, T: torch.Tensor) -> torch.Tensor:\n",
    "    # tens = constC - hC1 @ T @ hC2^T = constC - C1 T (2C2)^T = constC - 2 * C1 T C2^T\n",
    "    return constC - (hC1 @ T) @ hC2.T\n",
    "\n",
    "\n",
    "def gw_loss(constC: torch.Tensor, hC1: torch.Tensor, hC2: torch.Tensor, T: torch.Tensor) -> torch.Tensor:\n",
    "    tens = tensor_product(constC, hC1, hC2, T)\n",
    "    return (tens * T).sum()\n",
    "\n",
    "\n",
    "def gw_grad(constC: torch.Tensor, hC1: torch.Tensor, hC2: torch.Tensor, T: torch.Tensor) -> torch.Tensor:\n",
    "    # grad GW = 2 * tens\n",
    "    return 2.0 * tensor_product(constC, hC1, hC2, T)\n",
    "\n",
    "\n",
    "# ---------------------------------------------------------------------------\n",
    "# Stabilized Sinkhorn (log-domain)\n",
    "# ---------------------------------------------------------------------------\n",
    "\n",
    "def sinkhorn_log_stabilized(\n",
    "    a: torch.Tensor,\n",
    "    b: torch.Tensor,\n",
    "    C: torch.Tensor,\n",
    "    eps: float = 5e-3,\n",
    "    max_iter: int = 1_000,\n",
    "    tol: float = 1e-9,\n",
    "    stop_interval: int = 10,\n",
    "    log: bool = False,\n",
    "    f0: Optional[torch.Tensor] = None,\n",
    "    g0: Optional[torch.Tensor] = None\n",
    ") -> Tuple[torch.Tensor, Optional[Dict[str, torch.Tensor]]]:\n",
    "    \"\"\"Solve entropic OT with *stabilized* Sinkhorn in log-domain.\n",
    "\n",
    "    Minimizes:  <C, T> + eps * KL(T || a ⊗ b)  s.t. T1=a, T^T1=b, T>=0.\n",
    "\n",
    "    Returns the transport plan T and (optionally) dual potentials f, g.\n",
    "    \"\"\"\n",
    "    if a.dim() != 1 or b.dim() != 1 or C.dim() != 2:\n",
    "        raise ValueError(\"a,b must be 1D and C 2D\")\n",
    "    ns, nt = C.shape\n",
    "    if ns != a.shape[0] or nt != b.shape[0]:\n",
    "        raise ValueError(\"Shape mismatch: C(ns,nt), a(ns), b(nt)\")\n",
    "\n",
    "    # Normalize (avoid NaNs if sums differ a bit)\n",
    "    a = a / (a.sum() + 1e-300)\n",
    "    b = b / (b.sum() + 1e-300)\n",
    "\n",
    "    # log-domain potentials f,g; work in float64 for stability\n",
    "    dev = C.device\n",
    "    f = torch.zeros(C.shape[0], dtype=torch.float64, device=C.device) if f0 is None else f0.to(torch.float64)\n",
    "    g = torch.zeros(C.shape[1], dtype=torch.float64, device=C.device) if g0 is None else g0.to(torch.float64)\n",
    "    #f = torch.zeros(ns, dtype=torch.float64, device=dev)\n",
    "    #g = torch.zeros(nt, dtype=torch.float64, device=dev)\n",
    "    C64 = C.to(torch.float64)\n",
    "    a64 = a.to(torch.float64)\n",
    "    b64 = b.to(torch.float64)\n",
    "\n",
    "    # Precompute logs (handle zeros)\n",
    "    tiny = torch.finfo(torch.float64).tiny\n",
    "    loga = torch.where(a64 > 0, a64.log(), torch.full_like(a64, -float('inf')))\n",
    "    logb = torch.where(b64 > 0, b64.log(), torch.full_like(b64, -float('inf')))\n",
    "\n",
    "    def row_logsumexp(X: torch.Tensor) -> torch.Tensor:\n",
    "        # X: (ns, nt) -> lse over columns dim=1\n",
    "        m = torch.amax(X, dim=1, keepdim=True)\n",
    "        Z = torch.exp(X - m)\n",
    "        return (m.squeeze(1) + torch.log(Z.sum(dim=1) + tiny))\n",
    "\n",
    "    def col_logsumexp(X: torch.Tensor) -> torch.Tensor:\n",
    "        m = torch.amax(X, dim=0, keepdim=True)\n",
    "        Z = torch.exp(X - m)\n",
    "        return (m.squeeze(0) + torch.log(Z.sum(dim=0) + tiny))\n",
    "\n",
    "    last_err = None\n",
    "    for it in range(1, max_iter + 1):\n",
    "        # f-update\n",
    "        # f = eps * ( log a - logsumexp((g - C_ij)/eps over j) )\n",
    "        f = eps * (loga - row_logsumexp((g.unsqueeze(0) - C64) / eps))\n",
    "        # g-update\n",
    "        g = eps * (logb - col_logsumexp((f.unsqueeze(1) - C64) / eps))\n",
    "\n",
    "        if it % stop_interval == 0 or it == max_iter:\n",
    "            # build T only occasionally to check marginals\n",
    "            T = torch.exp((f.unsqueeze(1) + g.unsqueeze(0) - C64) / eps)\n",
    "            err_r = (T.sum(dim=1) - a64).abs().max()\n",
    "            err_c = (T.sum(dim=0) - b64).abs().max()\n",
    "            err = torch.max(err_r, err_c).item()\n",
    "            if last_err is None or err < last_err:\n",
    "                last_err = err\n",
    "            if err < tol:\n",
    "                break\n",
    "\n",
    "    # Final T\n",
    "    T = torch.exp((f.unsqueeze(1) + g.unsqueeze(0) - C64) / eps)\n",
    "\n",
    "    if log:\n",
    "        return T.to(C.dtype), {\n",
    "            'f': f.to(C.dtype),\n",
    "            'g': g.to(C.dtype),\n",
    "            'iters': torch.tensor(it),\n",
    "            'err': torch.tensor(last_err if last_err is not None else float('nan')),\n",
    "        }\n",
    "    return T.to(C.dtype), None\n",
    "\n",
    "\n",
    "# ---------------------------------------------------------------------------\n",
    "# Exact quadratic line search (POT formula)\n",
    "# ---------------------------------------------------------------------------\n",
    "\n",
    "def solve_gromov_linesearch(\n",
    "    G: torch.Tensor,\n",
    "    deltaG: torch.Tensor,\n",
    "    cost_G: torch.Tensor,\n",
    "    C1: torch.Tensor,\n",
    "    C2: torch.Tensor,\n",
    "    M_feat: torch.Tensor,   # (1-alpha) * M\n",
    "    reg_gw: float,          # alpha\n",
    "    symmetric: bool = False,\n",
    ") -> Tuple[torch.Tensor, int, torch.Tensor]:\n",
    "    # dot terms\n",
    "    dot_d = C1 @ deltaG @ C2.T\n",
    "    a = -reg_gw * (dot_d * deltaG).sum()\n",
    "\n",
    "    if symmetric:\n",
    "        b = (M_feat * deltaG).sum() - 2.0 * reg_gw * (dot_d * G).sum()\n",
    "    else:\n",
    "        b = (M_feat * deltaG).sum() - reg_gw * ( (dot_d * G).sum() + ((C1 @ G @ C2.T) * deltaG).sum() )\n",
    "\n",
    "    # min a t^2 + b t; convex if a>0, otherwise clip [0,1]\n",
    "    a_val = a.item()\n",
    "    b_val = b.item()\n",
    "    if a_val > 0:\n",
    "        t = -b_val / (2.0 * a_val)\n",
    "        alpha = torch.tensor(min(1.0, max(0.0, t)), device=G.device, dtype=G.dtype)\n",
    "    else:\n",
    "        alpha = torch.tensor(1.0 if (a_val + b_val) < 0 else 0.0, device=G.device, dtype=G.dtype)\n",
    "\n",
    "    cost_new = cost_G + a * (alpha ** 2) + b * alpha\n",
    "    return alpha, 1, cost_new\n",
    "\n",
    "\n",
    "# ---------------------------------------------------------------------------\n",
    "# Generic Conditional Gradient (the part that used emd)\n",
    "# ---------------------------------------------------------------------------\n",
    "\n",
    "def generic_conditional_gradient_sinkhorn(\n",
    "    a: torch.Tensor,\n",
    "    b: torch.Tensor,\n",
    "    M_feat: torch.Tensor,             # (1-alpha) * M\n",
    "    f: Callable[[torch.Tensor], torch.Tensor],\n",
    "    df: Callable[[torch.Tensor], torch.Tensor],\n",
    "    reg_gw: float,                    # alpha\n",
    "    G0: Optional[torch.Tensor],\n",
    "    eps: float,\n",
    "    C1: torch.Tensor,\n",
    "    C2: torch.Tensor,\n",
    "    numItermax: int = 200,\n",
    "    stopThr: float = 1e-9,\n",
    "    stopThr2: float = 1e-9,\n",
    "    verbose: bool = False,\n",
    "    log: bool = False,\n",
    "    sinkhorn_max_iter: int = 20,\n",
    "    sinkhorn_tol: float = 1e-9,\n",
    "    polished: bool = False\n",
    ") -> Union[torch.Tensor, Tuple[torch.Tensor, Dict]]:\n",
    "\n",
    "    device = M_feat.device\n",
    "    dtype = M_feat.dtype\n",
    "\n",
    "    if log:\n",
    "        log_dict: Dict[str, Union[float, torch.Tensor]] = {\"loss\": []}\n",
    "\n",
    "    # Init: barycentric plan\n",
    "    if G0 is None:\n",
    "        G = torch.outer(a, b)\n",
    "    else:\n",
    "        G = G0.clone()\n",
    "\n",
    "    def cost(G_: torch.Tensor) -> torch.Tensor:\n",
    "        return (M_feat * G_).sum() + reg_gw * f(G_)\n",
    "\n",
    "    cost_G = cost(G)\n",
    "    if log:\n",
    "        log_dict[\"loss\"].append(cost_G.item())\n",
    "\n",
    "    it = 0\n",
    "    if verbose:\n",
    "        print(f\"{'It.':<5s}|{'Loss':<12s}|{'Rel.d':<12s}|{'Abs.d':<12s}\")\n",
    "        print(\"-\" * 46)\n",
    "        print(f\"{it:<5d}|{cost_G.item():<12.4e}|{'0.0':<12s}|{'0.0':<12s}\")\n",
    "    f_cache = g_cache = None\n",
    "\n",
    "    while True:\n",
    "        it += 1\n",
    "        old_cost = cost_G\n",
    "\n",
    "        # Linearization\n",
    "        grad = df(G)\n",
    "        Mi = M_feat + reg_gw * grad\n",
    "        s = torch.median(Mi.abs()).item() + 1e-12\n",
    "        eps_use = eps * s\n",
    "\n",
    "        # Entropic subproblem (stabilized Sinkhorn)\n",
    "        Gc, logK = sinkhorn_log_stabilized(a, b, Mi, eps=eps_use, max_iter=sinkhorn_max_iter, tol=sinkhorn_tol, log=True, f0=f_cache, g0=g_cache)\n",
    "        f_cache = logK['f'] if log else None\n",
    "        g_cache = logK['g'] if log else None\n",
    "        # Direction and line search\n",
    "        deltaG = Gc - G\n",
    "        alpha_step, _, cost_G = solve_gromov_linesearch(G, deltaG, cost_G, C1, C2, M_feat, reg_gw, symmetric=False)\n",
    "\n",
    "        # Update\n",
    "        G = G + alpha_step * deltaG\n",
    "\n",
    "        # Convergence\n",
    "        if it >= numItermax:\n",
    "            break\n",
    "        abs_d = (cost_G - old_cost).abs()\n",
    "        rel_d = abs_d / (cost_G.abs() + 1e-300)\n",
    "        if log:\n",
    "            log_dict[\"loss\"].append(cost_G.item())\n",
    "        if verbose:\n",
    "            if it % 20 == 0:\n",
    "                print(f\"{'It.':<5s}|{'Loss':<12s}|{'Rel.d':<12s}|{'Abs.d':<12s}\")\n",
    "                print(\"-\" * 46)\n",
    "            print(f\"{it:<5d}|{cost_G.item():<12.4e}|{rel_d.item():<12.4e}|{abs_d.item():<12.4e}\")\n",
    "        if rel_d.item() < stopThr or abs_d.item() < stopThr2:\n",
    "            break\n",
    "    if polished:\n",
    "        time_loss = time.time()\n",
    "        # Add a last step, with an exact emd solver \n",
    "        M_final = M_feat + reg_gw * df(G)\n",
    "        T_exact, log_dict = ot.emd(a,b, M_final, numItermax=1000, log=True)\n",
    "        deltaG = T_exact - G\n",
    "        alpha_step, _, _ = solve_gromov_linesearch(G, deltaG, cost_G, C1, C2, M_feat, reg_gw, symmetric=False)\n",
    "        G = G + alpha_step * deltaG\n",
    "        print(f\"Polished in {time.time() - time_loss:.2f}s\")\n",
    "    if log:\n",
    "        return G, log_dict\n",
    "    return G\n",
    "\n",
    "\n",
    "# ---------------------------------------------------------------------------\n",
    "# FGW + stabilized Sinkhorn\n",
    "# ---------------------------------------------------------------------------\n",
    "\n",
    "def fused_gromov_wasserstein_sinkhorn(\n",
    "    M: torch.Tensor,\n",
    "    C1: torch.Tensor,\n",
    "    C2: torch.Tensor,\n",
    "    p: torch.Tensor,\n",
    "    q: torch.Tensor,\n",
    "    *,\n",
    "    loss_fun: str = 'square_loss',\n",
    "    alpha: float = 0.5,\n",
    "    eps: float = 5e-3,                   # Sinkhorn eps\n",
    "    armijo: bool = False,                # (ignored: quadratic LS used) left it because it was in pot\n",
    "    G0: Optional[torch.Tensor] = None,\n",
    "    log: bool = False,\n",
    "    numItermax: int = 200,\n",
    "    stopThr: float = 1e-9,\n",
    "    verbose: bool = False,\n",
    "    sinkhorn_max_iter: int = 20,\n",
    "    sinkhorn_tol: float = 1e-9,\n",
    "    polished: bool = False,\n",
    ") -> Union[torch.Tensor, Tuple[torch.Tensor, Dict]]:\n",
    "    \"\"\"FGW plan with stabilized Sinkhorn subproblems (GPU-ready).\"\"\"\n",
    "    # Normalization (safety)\n",
    "    p = (p / (p.sum() + 1e-300)).to(M.dtype)\n",
    "    q = (q / (q.sum() + 1e-300)).to(M.dtype)\n",
    "\n",
    "    constC, hC1, hC2 = init_matrix(C1, C2, p.to(C1.dtype), q.to(C2.dtype), loss_fun)\n",
    "\n",
    "    def f(G: torch.Tensor) -> torch.Tensor:\n",
    "        return gw_loss(constC, hC1, hC2, G)\n",
    "\n",
    "    def df(G: torch.Tensor) -> torch.Tensor:\n",
    "        return gw_grad(constC, hC1, hC2, G)\n",
    "\n",
    "    # POT weightings: (1-alpha) * W + alpha * GW\n",
    "    M_feat = (1.0 - alpha) * M\n",
    "    reg_gw = alpha\n",
    "\n",
    "    # Local monkey patch for solve_gromov_linesearch (access to C1/C2)\n",
    "    def solve_gromov_linesearch_local(G, dG, cost_G):\n",
    "        return solve_gromov_linesearch(G, dG, cost_G, C1, C2, M_feat, reg_gw, symmetric=False)\n",
    "\n",
    "    # Generic wrapper (reusing the LS above)\n",
    "    return generic_conditional_gradient_sinkhorn(\n",
    "        p, q, M_feat, f, df, reg_gw, G0, eps, C1, C2,\n",
    "        numItermax=numItermax, stopThr=stopThr, stopThr2=stopThr,\n",
    "        verbose=verbose, log=log,\n",
    "        sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol,\n",
    "        polished=polished\n",
    "    )\n",
    "\n",
    "\n",
    "def fused_gromov_wasserstein2_sinkhorn(\n",
    "    M: torch.Tensor,\n",
    "    C1: torch.Tensor,\n",
    "    C2: torch.Tensor,\n",
    "    p: torch.Tensor,\n",
    "    q: torch.Tensor,\n",
    "    *,\n",
    "    loss_fun: str = 'square_loss',\n",
    "    alpha: float = 0.5,\n",
    "    eps: float = 5e-3,\n",
    "    armijo: bool = False,\n",
    "    G0: Optional[torch.Tensor] = None,\n",
    "    log: bool = False,\n",
    "    numItermax: int = 200,\n",
    "    stopThr: float = 1e-9,\n",
    "    verbose: bool = False,\n",
    "    sinkhorn_max_iter: int = 20,\n",
    "    sinkhorn_tol: float = 1e-9,\n",
    "    polished: bool = False\n",
    ") -> Union[torch.Tensor, Tuple[torch.Tensor, Dict]]:\n",
    "    \"\"\"FGW distance (with stabilized Sinkhorn subproblems).\"\"\"\n",
    "    if log:\n",
    "        T, logd = fused_gromov_wasserstein_sinkhorn(\n",
    "            M, C1, C2, p, q, loss_fun=loss_fun, alpha=alpha, eps=eps,\n",
    "            armijo=armijo, G0=G0, log=True, numItermax=numItermax, stopThr=stopThr,\n",
    "            verbose=verbose, sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol,\n",
    "            polished=polished\n",
    "        )\n",
    "    else:\n",
    "        T = fused_gromov_wasserstein_sinkhorn(\n",
    "            M, C1, C2, p, q, loss_fun=loss_fun, alpha=alpha, eps=eps,\n",
    "            armijo=armijo, G0=G0, log=False, numItermax=numItermax, stopThr=stopThr,\n",
    "            verbose=verbose, sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol,\n",
    "            polished=polished\n",
    "        )\n",
    "\n",
    "    # Eval FGW (POT convention)\n",
    "    # NB: constC/hC1/hC2 recalculated for cleanliness (T might be of different dtype)\n",
    "    p_n = (p / (p.sum() + 1e-300)).to(M.dtype)\n",
    "    q_n = (q / (q.sum() + 1e-300)).to(M.dtype)\n",
    "    constC, hC1, hC2 = init_matrix(C1, C2, p_n.to(C1.dtype), q_n.to(C2.dtype), loss_fun)\n",
    "    W = (M * T).sum()\n",
    "    GW = gw_loss(constC, hC1, hC2, T)\n",
    "    fgw = (1.0 - alpha) * W + alpha * GW\n",
    "\n",
    "    if log:\n",
    "        logd['fgw_dist'] = fgw.detach().cpu().item()\n",
    "        return fgw, logd\n",
    "    return fgw\n",
    "\n",
    "\n",
    "# ---------------------------------------------------------------------------\n",
    "# Mini self-test\n",
    "# ---------------------------------------------------------------------------\n",
    "if __name__ == \"__main__\":\n",
    "    torch.set_printoptions(precision=4, sci_mode=True)\n",
    "    ns, nt = 5, 4\n",
    "    rng = torch.Generator().manual_seed(0)\n",
    "    C1 = torch.rand(ns, ns, generator=rng, dtype=torch.float64); C1 = 0.5*(C1+C1.T)\n",
    "    C2 = torch.rand(nt, nt, generator=rng, dtype=torch.float64); C2 = 0.5*(C2+C2.T)\n",
    "    X  = torch.rand(ns, 3, generator=rng, dtype=torch.float64)\n",
    "    Y  = torch.rand(nt, 3, generator=rng, dtype=torch.float64)\n",
    "    M  = torch.cdist(X, Y, p=2)\n",
    "    p  = torch.full((ns,), 1.0/ns, dtype=torch.float64)\n",
    "    q  = torch.full((nt,), 1.0/nt, dtype=torch.float64)\n",
    "    T  = fused_gromov_wasserstein_sinkhorn(M, C1, C2, p, q, alpha=0.3, eps=2e-2, numItermax=50, sinkhorn_max_iter=20)\n",
    "    d  = fused_gromov_wasserstein2_sinkhorn(M, C1, C2, p, q, alpha=0.3, eps=2e-2, numItermax=50, sinkhorn_max_iter=20)\n",
    "    print(\"T sum:\", T.sum().item(), \"FGW:\", float(d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "058686ca-6e86-4dcb-8c9e-6d8f162f2963",
   "metadata": {},
   "outputs": [],
   "source": [
    "import networkx as nx\n",
    "import numpy as np\n",
    "from typing import List, Dict, Optional, Tuple\n",
    "from pydantic import BaseModel, Field, ConfigDict\n",
    "from sentence_transformers import SentenceTransformer\n",
    "from sklearn.metrics import pairwise_distances\n",
    "import ot\n",
    "from copy import deepcopy\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "import os\n",
    "import torch.nn.functional as F\n",
    "\n",
    "model_path = \"sentence-transformers/all-MiniLM-L6-v2\"  # HF repo name\n",
    "\n",
    "\n",
    "def compute_embeddings(graphs: List[nx.Graph],\n",
    "                       model: Optional[SentenceTransformer] = None,\n",
    "                       device: Optional[torch.device] = None,\n",
    "                       dtype: torch.dtype = torch.float64) -> List[torch.Tensor]:\n",
    "    \"\"\"\n",
    "    Same API as before, but returns torch tensors [ns, d], normalized.\n",
    "    \"\"\"\n",
    "    if model is None:\n",
    "        model = SentenceTransformer(model_path, trust_remote_code=False)\n",
    "\n",
    "    if device is None:\n",
    "        device = torch.device(\"cuda\") if torch.cuda.is_available() else torch.device(\"cpu\")\n",
    "\n",
    "    out: List[torch.Tensor] = []\n",
    "    for G in graphs:\n",
    "        texts = [G.nodes[n][\"text\"] for n in G.nodes()]\n",
    "        # normalize_embeddings=True already L2-normalizes; convert_to_tensor keeps torch\n",
    "        E = model.encode(texts, normalize_embeddings=True, convert_to_tensor=True, device=str(device))\n",
    "        E = E.to(dtype=dtype)  # enforce float64 for numerical parity with POT\n",
    "        out.append(E)\n",
    "    return out\n",
    "\n",
    "\n",
    "# ========== Distance normalizations (torch) ==========\n",
    "\n",
    "def _ensure_tensor(x, dtype=torch.float64, device=None) -> torch.Tensor:\n",
    "    if isinstance(x, torch.Tensor):\n",
    "        return x.to(dtype=dtype, device=device if device is not None else x.device)\n",
    "    xt = torch.as_tensor(x, dtype=dtype)\n",
    "    return xt.to(device) if device is not None else xt\n",
    "\n",
    "\n",
    "def normalize_distance(D: torch.Tensor, factor: float = 1.5) -> torch.Tensor:\n",
    "    D = _ensure_tensor(D)\n",
    "    D = D.clone()\n",
    "    finite = torch.isfinite(D) & (D > 0)\n",
    "    if finite.any():\n",
    "        penalty = torch.quantile(D[finite], 0.95) * factor\n",
    "    else:\n",
    "        penalty = torch.tensor(1.0, dtype=D.dtype, device=D.device)\n",
    "    D[torch.isinf(D)] = penalty\n",
    "    # keep zeros on diagonal\n",
    "    if D.ndim == 2 and D.shape[0] == D.shape[1]:\n",
    "        D.fill_diagonal_(0)\n",
    "    return D\n",
    "\n",
    "\n",
    "def normalize_distance_exp(D: torch.Tensor, factor: float = 1.5, sim_power: float = 1.0) -> torch.Tensor:\n",
    "    D = _ensure_tensor(D)\n",
    "    D = D.clone()\n",
    "    penalty = torch.exp(torch.tensor(2.0, dtype=D.dtype, device=D.device)) * factor\n",
    "    D[torch.isinf(D)] = penalty\n",
    "    D[D <= 0] = penalty\n",
    "    if D.ndim == 2 and D.shape[0] == D.shape[1]:\n",
    "        D.fill_diagonal_(0.0)\n",
    "    return D\n",
    "\n",
    "\n",
    "# ========== Structure distances (torch) ==========\n",
    "\n",
    "def compute_structure_distances(graphs: List[nx.Graph], factor: float = 1.5) -> List[torch.Tensor]:\n",
    "    \"\"\"\n",
    "    Uses Floyd–Warshall via networkx (as in original), then converts to torch and normalizes.\n",
    "    \"\"\"\n",
    "    dists: List[torch.Tensor] = []\n",
    "    for G in graphs:\n",
    "        # exact same method as before\n",
    "        D_np = np.array(nx.floyd_warshall_numpy(G), dtype=np.float64)\n",
    "        D = torch.from_numpy(D_np)\n",
    "        D = normalize_distance(D, factor=factor)\n",
    "        dists.append(D)\n",
    "    return dists\n",
    "\n",
    "\n",
    "def compute_similarity_weighted_structure_distances(\n",
    "    graphs: List[nx.Graph],\n",
    "    embeddings: List[torch.Tensor],\n",
    "    factor: float = 1.5,\n",
    "    similarity_power: float = 1.0\n",
    ") -> List[torch.Tensor]:\n",
    "    \"\"\"\n",
    "    Follows the original logic exactly:\n",
    "    - build a weighted graph where edge weight = 1/(exp(sim)/e)**power\n",
    "    - then take the adjacency matrix (not shortest paths), normalize with 'exp' scheme\n",
    "    \"\"\"\n",
    "    weighted_dists: List[torch.Tensor] = []\n",
    "\n",
    "    for G, E in zip(graphs, embeddings):\n",
    "        # Ensure E is [ns, d] torch tensor, normalized (SentenceTransformer already did)\n",
    "        E = _ensure_tensor(E)\n",
    "\n",
    "        # Copy topology into weighted graph\n",
    "        G_weighted = nx.DiGraph() if G.is_directed() else nx.Graph()\n",
    "        G_weighted.add_nodes_from(G.nodes(data=True))\n",
    "\n",
    "        nodes_list = list(G.nodes)\n",
    "        idx = {n: i for i, n in enumerate(nodes_list)}\n",
    "\n",
    "        for u, v in G.edges():\n",
    "            eu = E[idx[u]]\n",
    "            ev = E[idx[v]]\n",
    "            # cosine similarity (manual, to mirror sklearn behavior with normalized E)\n",
    "            sim = F.cosine_similarity(eu.unsqueeze(0), ev.unsqueeze(0)).item()\n",
    "            transfo_sim = np.exp(sim) / np.exp(1)   # keep identical transform\n",
    "            adjusted_weight = 1.0 / ((transfo_sim ** similarity_power) + 1e-6)\n",
    "            G_weighted.add_edge(u, v, weight=float(adjusted_weight))\n",
    "\n",
    "        # Exactly like the original: adjacency matrix, then normalize_distance_exp\n",
    "        A = nx.adjacency_matrix(G_weighted, weight='weight').toarray().astype(np.float64)\n",
    "        D = torch.from_numpy(A)\n",
    "        D = normalize_distance_exp(D, factor=factor, sim_power=similarity_power)\n",
    "        weighted_dists.append(D)\n",
    "\n",
    "    return weighted_dists\n",
    "\n",
    "\n",
    "# ========== Cosine helper (unchanged semantics) ==========\n",
    "\n",
    "def safe_cosine_similarity(vec1, vec2) -> float:\n",
    "    v1 = np.asarray(vec1)\n",
    "    v2 = np.asarray(vec2)\n",
    "    norm1 = np.linalg.norm(v1)\n",
    "    norm2 = np.linalg.norm(v2)\n",
    "    if norm1 == 0 or norm2 == 0:\n",
    "        return 1/np.exp(2)\n",
    "    return float(cosine_similarity([v1], [v2])[0, 0])\n",
    "\n",
    "\n",
    "# ========== FGW / GW using Sinkhorn (torch) ==========\n",
    "\n",
    "\n",
    "def compute_fgw(\n",
    "    F1: torch.Tensor,\n",
    "    D1: torch.Tensor,\n",
    "    F2: torch.Tensor,\n",
    "    D2: torch.Tensor,\n",
    "    alpha: float = 0.5,\n",
    "    *,\n",
    "    eps: float = 2e-2,\n",
    "    sinkhorn_max_iter: int = 20,\n",
    "    sinkhorn_tol: float = 1e-9\n",
    ") -> Tuple[float, torch.Tensor]:\n",
    "    \"\"\"\n",
    "    Torch version mirroring original semantics:\n",
    "    - uniform p, q\n",
    "    - handle NaNs like before\n",
    "    - M = pairwise euclidean distances\n",
    "    - returns (dist, T)\n",
    "    \"\"\"\n",
    "    device = F1.device\n",
    "    dtype = torch.float64\n",
    "\n",
    "    F1 = _ensure_tensor(F1, dtype=dtype, device=device)\n",
    "    F2 = _ensure_tensor(F2, dtype=dtype, device=device)\n",
    "    D1 = _ensure_tensor(D1, dtype=dtype, device=device)\n",
    "    D2 = _ensure_tensor(D2, dtype=dtype, device=device)\n",
    "\n",
    "    ns, nt = F1.shape[0], F2.shape[0]\n",
    "    p = torch.full((ns,), 1.0/ns, dtype=dtype, device=device)\n",
    "    q = torch.full((nt,), 1.0/nt, dtype=dtype, device=device)\n",
    "\n",
    "    factor = 1.5\n",
    "    # NaN handling (same constants)\n",
    "    penalty = torch.exp(torch.tensor(2.0, dtype=dtype, device=device)) * factor\n",
    "    D1 = torch.nan_to_num(D1, nan=penalty.item())\n",
    "    D2 = torch.nan_to_num(D2, nan=penalty.item())\n",
    "\n",
    "    # Feature cost M\n",
    "    M = torch.cdist(F1, F2, p=2).to(dtype)\n",
    "\n",
    "    # Transport plan (Sinkhorn FGW)\n",
    "    T = fused_gromov_wasserstein_sinkhorn(\n",
    "        M, D1, D2, p, q, alpha=alpha,\n",
    "        eps=eps, numItermax=200, sinkhorn_max_iter=sinkhorn_max_iter,\n",
    "        sinkhorn_tol=sinkhorn_tol, log=False\n",
    "    )\n",
    "    # Distance (FGW2)\n",
    "    dist = fused_gromov_wasserstein2_sinkhorn(\n",
    "        M, D1, D2, p, q, alpha=alpha,\n",
    "        eps=eps, numItermax=200, sinkhorn_max_iter=sinkhorn_max_iter,\n",
    "        sinkhorn_tol=sinkhorn_tol, log=False\n",
    "    )\n",
    "    return float(dist.item()), T\n",
    "\n",
    "\n",
    "def compute_gw(D1: torch.Tensor, D2: torch.Tensor) -> Tuple[float, torch.Tensor]:\n",
    "    \"\"\"\n",
    "    Torch version of GW with uniform p/q (uses FGW with M=0 and alpha=1 for GW weight).\n",
    "    Returns (gw_dist, T)\n",
    "    \"\"\"\n",
    "    device = D1.device\n",
    "    dtype = torch.float64\n",
    "    D1 = _ensure_tensor(D1, dtype=dtype, device=device)\n",
    "    D2 = _ensure_tensor(D2, dtype=dtype, device=device)\n",
    "    ns, nt = D1.shape[0], D2.shape[0]\n",
    "    p = torch.full((ns,), 1.0/ns, dtype=dtype, device=device)\n",
    "    q = torch.full((nt,), 1.0/nt, dtype=dtype, device=device)\n",
    "    M = torch.zeros((ns, nt), dtype=dtype, device=device)\n",
    "\n",
    "    # Plan + distance\n",
    "    T = fused_gromov_wasserstein_sinkhorn(M, D1, D2, p, q, alpha=1.0, eps=2e-2, log=False)\n",
    "    dist = fused_gromov_wasserstein2_sinkhorn(M, D1, D2, p, q, alpha=1.0, eps=2e-2, log=False)\n",
    "    return float(dist.item()), T\n",
    "\n",
    "\n",
    "# ========== Graph helpers (unchanged behavior) ==========\n",
    "\n",
    "def assign_depths(G: nx.DiGraph):\n",
    "    if not nx.is_directed_acyclic_graph(G):\n",
    "        raise ValueError(\"Le graphe doit être un DAG pour que la profondeur soit bien définie.\")\n",
    "    depths = {}\n",
    "    for node in nx.topological_sort(G):\n",
    "        preds = list(G.predecessors(node))\n",
    "        depths[node] = 0 if not preds else 1 + max(depths[pred] for pred in preds)\n",
    "        G.nodes[node][\"depth\"] = depths[node]\n",
    "\n",
    "\n",
    "def compute_node_features(G, embeddings: Dict[str, np.ndarray]) -> torch.Tensor:\n",
    "    # unchanged semantics, returns torch tensor\n",
    "    arr = np.array([embeddings[n] for n in G.nodes], dtype=np.float64)\n",
    "    return torch.from_numpy(arr)\n",
    "\n",
    "\n",
    "def compute_structure_matrix(G) -> torch.Tensor:\n",
    "    D_np = np.array(nx.floyd_warshall_numpy(G), dtype=np.float64)\n",
    "    return torch.from_numpy(D_np)\n",
    "\n",
    "\n",
    "\n",
    "def _fuse_text_compact(node_ids: List[str], G: nx.DiGraph, compact_fusion: bool = True) -> str:\n",
    "    if not compact_fusion:\n",
    "        return \" | \".join([G.nodes[n][\"text\"] for n in node_ids])\n",
    "\n",
    "    texts_by_section = {}\n",
    "    for node_id in node_ids:\n",
    "        node_text = G.nodes[node_id][\"text\"]\n",
    "        if node_id.startswith(\"section_\"):\n",
    "            section_num = node_id.split(\"_\")[1]\n",
    "        else:\n",
    "            section_num = \"unknown\"\n",
    "        texts_by_section.setdefault(section_num, []).append((node_id, node_text))\n",
    "\n",
    "    fused_texts = []\n",
    "    def _safe_int(x):\n",
    "        try:\n",
    "            return int(x)\n",
    "        except Exception:\n",
    "            return 10**9\n",
    "\n",
    "    for section_num in sorted(texts_by_section.keys(), key=_safe_int):\n",
    "        section_items = texts_by_section[section_num]\n",
    "        section_items.sort(key=lambda item: (\n",
    "            _safe_int(item[0].split(\"_\")[3] if len(item[0].split(\"_\")) > 3 else 10**9),\n",
    "            _safe_int(item[0].split(\"_\")[5] if len(item[0].split(\"_\")) > 5 else 10**9),\n",
    "        ))\n",
    "        section_text = \" \".join([item[1] for item in section_items])\n",
    "        fused_texts.append(f\"From section_{section_num}: {section_text}\")\n",
    "    return \"\\n----\\n\".join(fused_texts)\n",
    "\n",
    "\n",
    "def _delete_rows_cols(M: torch.Tensor, indices_desc: List[int]) -> torch.Tensor:\n",
    "    \"\"\"\n",
    "    Delete rows/cols at positions in 'indices_desc' (sorted descending) exactly like np.delete used twice.\n",
    "    \"\"\"\n",
    "    keep = torch.ones(M.shape[0], dtype=torch.bool, device=M.device)\n",
    "    keep[indices_desc] = False\n",
    "    M2 = M[keep][:, keep]\n",
    "    return M2\n",
    "\n",
    "\n",
    "def test_fusion(tmp_set: List[str], candidate_set: List[str], G: nx.DiGraph, G_fus: nx.DiGraph,\n",
    "                map_index_node: Dict[str, int],\n",
    "                embedding_current_graph: List[torch.Tensor], dists_current_graph: List[torch.Tensor],\n",
    "                model: SentenceTransformer, current: str, depth: int, uuid_fus: str,\n",
    "                initial_prob: float, alpha: float, structure_distance: str,\n",
    "                compact_fusion: bool = False,\n",
    "                eps: float = 2e-2, sinkhorn_max_iter: int = 20, sinkhorn_tol: float = 1e-9\n",
    "               ) -> Tuple[float, List[torch.Tensor], List[torch.Tensor], nx.DiGraph, Dict[str, int]]:\n",
    "\n",
    "    new_embeddings_fus = [embedding_current_graph[0].clone()]\n",
    "    new_distance_struct = [dists_current_graph[0].clone()]\n",
    "    G_fus_copy = G_fus.copy()\n",
    "    map_index_node_copy = dict(map_index_node)\n",
    "\n",
    "    fused_text = _fuse_text_compact(tmp_set, G, compact_fusion)\n",
    "    tmp_node_id = f\"fused_{current}_{depth}_{uuid_fus}\"\n",
    "\n",
    "    # remove nodes in tmp_set (highest index first)\n",
    "    indices_to_remove = sorted([map_index_node_copy[n] for n in tmp_set], reverse=True)\n",
    "    if len(indices_to_remove) > 0:\n",
    "        new_embeddings_fus[0] = torch.vstack([\n",
    "            new_embeddings_fus[0][:min_idx]\n",
    "            if i == 0 else  # just to placate editor\n",
    "            new_embeddings_fus[0]\n",
    "            for i, min_idx in []\n",
    "        ]) if False else new_embeddings_fus[0]  # no-op placeholder to keep structure similar\n",
    "        new_embeddings_fus[0] = new_embeddings_fus[0][torch.tensor(\n",
    "            [i for i in range(new_embeddings_fus[0].shape[0]) if i not in set(indices_to_remove)],\n",
    "            dtype=torch.long, device=new_embeddings_fus[0].device\n",
    "        )]\n",
    "\n",
    "        new_distance_struct[0] = _delete_rows_cols(new_distance_struct[0], indices_to_remove)\n",
    "\n",
    "        # update indices map\n",
    "        for n2, idx in list(map_index_node_copy.items()):\n",
    "            for cut in indices_to_remove:\n",
    "                if idx > cut:\n",
    "                    idx -= 1\n",
    "            map_index_node_copy[n2] = idx\n",
    "\n",
    "    # add fused node in graph and embeddings\n",
    "    if tmp_node_id in G_fus_copy.nodes:\n",
    "        G_fus_copy.nodes[tmp_node_id][\"text\"] = fused_text\n",
    "    else:\n",
    "        G_fus_copy.add_node(tmp_node_id, text=fused_text, type=\"fused\")\n",
    "        # encode fused text\n",
    "        new_embedding = model.encode([fused_text], normalize_embeddings=True, convert_to_tensor=True).to(dtype=torch.float64)\n",
    "        new_embeddings_fus[0] = torch.cat([new_embeddings_fus[0], new_embedding], dim=0)\n",
    "\n",
    "        # extend distance matrix with penalty rows/cols\n",
    "        pen = torch.exp(torch.tensor(2.0, dtype=new_distance_struct[0].dtype, device=new_distance_struct[0].device)) * 1.5\n",
    "        num_nodes = new_distance_struct[0].shape[0]\n",
    "        col = torch.full((num_nodes, 1), pen, dtype=new_distance_struct[0].dtype, device=new_distance_struct[0].device)\n",
    "        row = torch.full((1, num_nodes + 1), pen, dtype=new_distance_struct[0].dtype, device=new_distance_struct[0].device)\n",
    "        new_distance_struct[0] = torch.cat([new_distance_struct[0], col], dim=1)\n",
    "        new_distance_struct[0] = torch.cat([new_distance_struct[0], row], dim=0)\n",
    "        new_distance_struct[0][-1, -1] = 0.0\n",
    "\n",
    "    # add edges for fused node\n",
    "    for n in tmp_set:\n",
    "        for gc in G.successors(n):\n",
    "            G_fus_copy.add_edge(\n",
    "                tmp_node_id, gc,\n",
    "                prob=G.edges[n, gc].get(\"prob\", initial_prob),\n",
    "                structure_distance=G.edges[n, gc].get(\"structure_distance\", 1.0)\n",
    "            )\n",
    "            if gc in map_index_node_copy:\n",
    "                new_distance_struct[0][-1, map_index_node_copy[gc]] = G.edges[n, gc].get(\"structure_distance\", 1.0)\n",
    "\n",
    "    # edge from current to fused node\n",
    "    new_prob = float(np.mean([G.edges[current, gc].get(\"prob\", initial_prob) for gc in tmp_set])) if tmp_set else initial_prob\n",
    "    new_structure_distance = float(np.mean([G.edges[current, gc].get(\"structure_distance\", 1.0) for gc in tmp_set])) if tmp_set else 1.0\n",
    "    G_fus_copy.add_edge(current, tmp_node_id, prob=new_prob, structure_distance=new_structure_distance)\n",
    "\n",
    "    if current in map_index_node_copy:\n",
    "        new_distance_struct[0][map_index_node_copy[current], -1] = new_structure_distance\n",
    "\n",
    "    # remove old nodes\n",
    "    for child_id in tmp_set:\n",
    "        if G_fus_copy.has_edge(current, child_id):\n",
    "            G_fus_copy.remove_edge(current, child_id)\n",
    "        if G_fus_copy.has_node(child_id):\n",
    "            G_fus_copy.remove_node(child_id)\n",
    "\n",
    "    # structure distances\n",
    "    if structure_distance != \"similarity_weighted\":\n",
    "        dists = compute_structure_distances([G_fus_copy])\n",
    "    else:\n",
    "        dists = new_distance_struct  # keep incremental matrix\n",
    "\n",
    "    # FGW distance\n",
    "    time_fgw = time.time()\n",
    "    fgw_dist, _ = compute_fgw(\n",
    "        embedding_current_graph[0], dists_current_graph[0],\n",
    "        new_embeddings_fus[0], dists[0], alpha=alpha,\n",
    "        eps=eps, sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol\n",
    "    )\n",
    "    \n",
    "    print(f\"[INFO] Time for the fgw computation : {time.time() - time_fgw:.4f} seconds\")\n",
    "\n",
    "    return fgw_dist, new_embeddings_fus, dists, G_fus_copy, map_index_node_copy\n",
    "\n",
    "\n",
    "def dichotomie_fusion(sorted_children_proba, candidate_set, candidate_vecs,\n",
    "                      G, G_fus, map_index_node,\n",
    "                      embedding_current_graph, dists_current_graph,\n",
    "                      model, current, depth, uuid_fus,\n",
    "                      initial_prob, alpha, structure_distance,\n",
    "                      distance_restante, compact_fusion=False, enable_logging=False,\n",
    "                      eps: float = 2e-2, sinkhorn_max_iter: int = 20, sinkhorn_tol: float = 1e-9):\n",
    "    \"\"\"\n",
    "    Binary search identical to original, but torch-based FGW calls.\n",
    "    \"\"\"\n",
    "    left, right = 1, len(sorted_children_proba)\n",
    "    best_k = 0\n",
    "    best_candidate_set = candidate_set\n",
    "    best_candidate_vecs = candidate_vecs[:]\n",
    "    best_embedding = embedding_current_graph\n",
    "    best_distance = dists_current_graph\n",
    "    best_G_fus = G_fus\n",
    "    best_map_index_node = dict(map_index_node)\n",
    "\n",
    "    while left <= right:\n",
    "        mid = (left + right) // 2\n",
    "        tmp_set = candidate_set + [cid for cid, _ in sorted_children_proba[:mid]]\n",
    "        tmp_vecs = candidate_vecs + [s for _, s in sorted_children_proba[:mid]]\n",
    "\n",
    "        fgw_dist, new_emb, new_dist, new_G_fus, map_index_node_copy = test_fusion(\n",
    "            tmp_set, candidate_set, G, G_fus, map_index_node,\n",
    "            embedding_current_graph, dists_current_graph,\n",
    "            model, current, depth, uuid_fus,\n",
    "            initial_prob, alpha, structure_distance, compact_fusion,\n",
    "            eps=eps, sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol\n",
    "        )\n",
    "        if enable_logging:\n",
    "            print(f\"[DEBUG] mid={mid}, fgw_dist={fgw_dist:.4f}, distance_restante={distance_restante:.4f}\")\n",
    "        if fgw_dist <= distance_restante:\n",
    "            best_k = mid\n",
    "            best_candidate_set = tmp_set\n",
    "            best_candidate_vecs = tmp_vecs\n",
    "            best_embedding = new_emb\n",
    "            best_distance = new_dist\n",
    "            best_G_fus = new_G_fus\n",
    "            best_map_index_node = map_index_node_copy\n",
    "            left = mid + 1\n",
    "        else:\n",
    "            right = mid - 1\n",
    "\n",
    "    if enable_logging:\n",
    "        #print(f\"[INFO] FGW distance: {fgw_dist:.4f}\")\n",
    "        print(f\"[INFO] Optimal set containing: {best_candidate_set} (FGW<=budget)\")\n",
    "        print(f\"[INFO] Total candidate set: {sorted_children_proba}\")\n",
    "\n",
    "    return best_candidate_set, best_candidate_vecs, best_embedding, best_distance, best_G_fus, best_map_index_node\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "56ba73fb-fc2c-433a-a878-0fa08fd411c7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# -*- coding: utf-8 -*-\n",
    "\"\"\"\n",
    "Torch-based FGW traversal (genetic optimized) matching the original implementation.\n",
    "\"\"\"\n",
    "\n",
    "import time\n",
    "import uuid\n",
    "import numpy as np\n",
    "import torch\n",
    "import networkx as nx\n",
    "from typing import List, Dict, Optional, Tuple\n",
    "from pydantic import BaseModel, Field\n",
    "from sentence_transformers import SentenceTransformer\n",
    "\n",
    "\n",
    "# ===== Config (unchanged)\n",
    "class FGWConfig(BaseModel):\n",
    "    alpha: float = 0.5\n",
    "    max_depth: int = 3\n",
    "    sim_threshold: float = 0.8\n",
    "    fgw_threshold: float = 0.1\n",
    "    initial_prob: float = 0.8\n",
    "    initial_prob_new: float = 0.1\n",
    "    lr: float = 0.8\n",
    "    structure_distance: str = \"base\"  # \"base\" or \"similarity_weighted\"\n",
    "    compact_fusion: bool = True\n",
    "    enable_logging: bool = False\n",
    "\n",
    "\n",
    "def _log_if_enabled(message: str, enable_logging: bool, level: str = \"INFO\"):\n",
    "    if enable_logging:\n",
    "        print(f\"[{level}] {message}\")\n",
    "\n",
    "\n",
    "def _create_fused_text_compact(node_ids: List[str], G: nx.DiGraph, compact_fusion: bool = True) -> str:\n",
    "    if not compact_fusion:\n",
    "        return \" | \".join([G.nodes[n][\"text\"] for n in node_ids])\n",
    "\n",
    "    texts_by_section = {}\n",
    "    for node_id in node_ids:\n",
    "        node_text = G.nodes[node_id][\"text\"]\n",
    "        if node_id.startswith(\"section_\"):\n",
    "            section_num = node_id.split(\"_\")[1]\n",
    "        else:\n",
    "            section_num = \"unknown\"\n",
    "        texts_by_section.setdefault(section_num, []).append((node_id, node_text))\n",
    "\n",
    "    def _safe_int(x):\n",
    "        try:\n",
    "            return int(x)\n",
    "        except Exception:\n",
    "            return 10**9\n",
    "\n",
    "    fused_texts = []\n",
    "    for section_num in sorted(texts_by_section.keys(), key=_safe_int):\n",
    "        section_items = texts_by_section[section_num]\n",
    "        section_items.sort(key=lambda item: (\n",
    "            _safe_int(item[0].split(\"_\")[3] if len(item[0].split(\"_\")) > 3 else 10**9),\n",
    "            _safe_int(item[0].split(\"_\")[5] if len(item[0].split(\"_\")) > 5 else 10**9),\n",
    "        ))\n",
    "        section_text = \" \".join([item[1] for item in section_items])\n",
    "        fused_texts.append(f\"From section_{section_num}: {section_text}\")\n",
    "    return \"\\n----\\n\".join(fused_texts)\n",
    "\n",
    "\n",
    "def _clean_graph_dtypes(G: nx.DiGraph):\n",
    "    # Convert numpy/torch float types to Python float for safe serialization\n",
    "    for u, v, data in G.edges(data=True):\n",
    "        for key, value in list(data.items()):\n",
    "            if isinstance(value, (np.float32, np.float64)):\n",
    "                data[key] = float(value)\n",
    "            elif isinstance(value, torch.Tensor) and value.numel() == 1:\n",
    "                data[key] = float(value.item())\n",
    "    for n, data in G.nodes(data=True):\n",
    "        for key, value in list(data.items()):\n",
    "            if isinstance(value, (np.float32, np.float64)):\n",
    "                data[key] = float(value)\n",
    "            elif isinstance(value, torch.Tensor) and value.numel() == 1:\n",
    "                data[key] = float(value.item())\n",
    "\n",
    "\n",
    "def reward_distribution(edges_similarity: Dict[Tuple[str, str], float], reward: float, lr: float = 0.8) -> Optional[Dict[Tuple[str, str], float]]:\n",
    "    if not edges_similarity:\n",
    "        return None\n",
    "    vals = list(edges_similarity.values())\n",
    "    mean_similarity = float(np.mean(vals))\n",
    "    if mean_similarity == 0:\n",
    "        return None\n",
    "    updated_edges = {}\n",
    "    for edge, similarity in edges_similarity.items():\n",
    "        if similarity >= mean_similarity:\n",
    "            change = lr * (similarity - mean_similarity) * reward\n",
    "            updated_edges[edge] = float(change)\n",
    "    return updated_edges\n",
    "\n",
    "\n",
    "def recursive_traversal_with_score_fusion_fgw_genetic_optimized(\n",
    "    start_node: str,\n",
    "    question: str,\n",
    "    embeddings: EmbeddingStore,\n",
    "    G: nx.DiGraph,\n",
    "    model: SentenceTransformer,\n",
    "    max_depth: int = 2,\n",
    "    sim_threshold: float = 0.8,\n",
    "    fgw_threshold: float = 0.1,\n",
    "    alpha: float = 0.5,\n",
    "    initial_prob: float = 0.8,\n",
    "    initial_prob_new: float = 0.1,\n",
    "    lr: float = 0.8,\n",
    "    structure_distance: str = \"base\",\n",
    "    compact_fusion: bool = True,\n",
    "    enable_logging: bool = True,\n",
    "    *,\n",
    "    eps: float = 2e-2,\n",
    "    sinkhorn_max_iter: int = 20,\n",
    "    sinkhorn_tol: float = 1e-9\n",
    ") -> List[TraversalStep]:\n",
    "    \"\"\"\n",
    "    Torch version strictly following the original 'genetic optimized' algorithm.\n",
    "    \"\"\"\n",
    "    # Ensure all tensors are on the same device (GPU if available)\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    if enable_logging:\n",
    "        print(f\"🚀 Using device: {device}\")\n",
    "    \n",
    "    path: List[TraversalStep] = [TraversalStep(node_id=start_node, similarity=None)]\n",
    "    time_start = time.time()\n",
    "    current = start_node\n",
    "\n",
    "    # Encode query vector (normalized)\n",
    "\n",
    "    query_vec = model.encode(\n",
    "        [question],\n",
    "        normalize_embeddings=True,\n",
    "        convert_to_tensor=True\n",
    "    )[0].to(dtype=torch.float64, device=device)   \n",
    "\n",
    "    distance_restante = fgw_threshold\n",
    "\n",
    "    # Graph-wide embeddings (torch) - ensure GPU usage\n",
    "    embedding_current_graph = compute_embeddings([G], model=model, device=device)\n",
    "    map_index_node = {n: i for i, n in enumerate(G.nodes)}\n",
    "\n",
    "    # Structure distances according to mode\n",
    "    if structure_distance == \"similarity_weighted\":\n",
    "        dists_current_graph = compute_similarity_weighted_structure_distances([G], embedding_current_graph)\n",
    "        for u, v in G.edges():\n",
    "            G.edges[u, v][\"structure_distance\"] = float(dists_current_graph[0][map_index_node[u], map_index_node[v]].item())\n",
    "    else:\n",
    "        dists_current_graph = compute_structure_distances([G])\n",
    "\n",
    "    temps_wasted = 0.0\n",
    "\n",
    "    for depth in range(max_depth):\n",
    "        _log_if_enabled(f\"Starting depth {depth} with node {current}\", enable_logging)\n",
    "\n",
    "        children = list(G.successors(current))\n",
    "        if not children:\n",
    "            break\n",
    "\n",
    "        # Build child vectors from EmbeddingStore (may hold numpy); cast to torch64 on GPU\n",
    "        child_vecs = []\n",
    "        for c in children:\n",
    "            v = embeddings.vectors[c]\n",
    "            vt = torch.as_tensor(v, dtype=torch.float64, device=device)\n",
    "            child_vecs.append(vt)\n",
    "        child_mat = torch.stack(child_vecs, dim=0)\n",
    "        sims = (child_mat @ query_vec)  # dot since normalized\n",
    "\n",
    "        # sorting & relevant filters (keep exact logic/thresholding)\n",
    "        sims_np = sims.cpu().numpy()\n",
    "        sorted_children = sorted(zip(children, sims_np), key=lambda x: x[1], reverse=True)\n",
    "        max_sim = float(np.max(sims_np)) if len(sims_np) > 0 else 0.0\n",
    "        sorted_children_relevant = [c for c in sorted_children if c[1] > sim_threshold * max_sim]\n",
    "        # No use of proba since we only go through one piece of text once for this benchmark\n",
    "        sorted_children_proba = sorted_children_relevant\n",
    "        _log_if_enabled(f\"Relevant children: {[f'{c[0]}: {c[1]:.3f}' for c in sorted_children_relevant]}\", enable_logging)\n",
    "        _log_if_enabled(f\"Probability children: {[f'{c[0]}: {c[1]:.3f}' for c in sorted_children_proba]}\", enable_logging)\n",
    "\n",
    "        candidate_set: List[str] = []\n",
    "        candidate_vecs: List[float] = []\n",
    "        G_fus = G.copy()\n",
    "        _log_if_enabled(f\"Preprocessing time: {time.time() - time_start:.3f} seconds\", enable_logging)\n",
    "\n",
    "        uuid_fus = uuid.uuid4().hex[:8]\n",
    "        new_embedding_fus_etape_precedente = embedding_current_graph.copy()\n",
    "        new_distance_struct_etape_precedente = dists_current_graph.copy()\n",
    "\n",
    "        # === Binary search on fusion set size (exactly as original) ===\n",
    "        candidate_set, candidate_vecs, new_embedding_fus_etape_precedente, new_distance_struct_etape_precedente, G_fus, map_index_node_copy = dichotomie_fusion(\n",
    "            sorted_children_proba, candidate_set, candidate_vecs,\n",
    "            G, G_fus, map_index_node,\n",
    "            embedding_current_graph, dists_current_graph,\n",
    "            model, current, depth, uuid_fus,\n",
    "            initial_prob, alpha, structure_distance,\n",
    "            distance_restante, compact_fusion, enable_logging,\n",
    "            eps=eps, sinkhorn_max_iter=sinkhorn_max_iter, sinkhorn_tol=sinkhorn_tol\n",
    "        )\n",
    "\n",
    "        map_index_node = map_index_node_copy\n",
    "\n",
    "        if len(candidate_set) > 1:\n",
    "            time_start_fusion = time.time()\n",
    "            fused_text = _create_fused_text_compact(candidate_set, G, compact_fusion)\n",
    "            new_node_id = f\"fused_{current}_{depth}_{uuid.uuid4().hex[:8]}\"\n",
    "            G.add_node(new_node_id, text=fused_text, type=\"fused\")\n",
    "            # store embedding into EmbeddingStore\n",
    "            emb_new = model.encode([fused_text], normalize_embeddings=True, convert_to_tensor=True).to(dtype=torch.float64)\n",
    "            embeddings.vectors[new_node_id] = emb_new.cpu().numpy()  # keep exact behavior: EmbeddingStore stores np arrays\n",
    "\n",
    "            avg_prob = float(np.mean([G.edges[current, c].get(\"prob\", initial_prob) for c in candidate_set]))\n",
    "            avg_struct_dist = float(np.mean([G.edges[current, c].get(\"structure_distance\", 1.0) for c in candidate_set]))\n",
    "            G.add_edge(current, new_node_id, prob=avg_prob, structure_distance=avg_struct_dist)\n",
    "\n",
    "            for c in candidate_set:\n",
    "                for gc in G.successors(c):\n",
    "                    G.add_edge(new_node_id, gc,\n",
    "                               prob=G.edges[c, gc].get(\"prob\", initial_prob),\n",
    "                               structure_distance=G.edges[c, gc].get(\"structure_distance\", 1.0))\n",
    "                G.remove_edge(current, c)\n",
    "                G.remove_node(c)\n",
    "                _log_if_enabled(f\"Removed edge {current} -> {c} and node {c}\", enable_logging)\n",
    "\n",
    "            # update mappings\n",
    "            map_index_node[new_node_id] = len(G.nodes) - 1\n",
    "            embedding_current_graph = new_embedding_fus_etape_precedente.copy()\n",
    "            _log_if_enabled(f\"Fusion time: {time.time() - time_start_fusion:.3f} seconds\", enable_logging)\n",
    "\n",
    "            if structure_distance == \"similarity_weighted\":\n",
    "                dists_current_graph = new_distance_struct_etape_precedente.copy()\n",
    "            else:\n",
    "                dists_current_graph = compute_structure_distances([G])\n",
    "\n",
    "            # Remaining children → grandchildren scan & reward\n",
    "            remaining_children = sorted_children_proba[len(candidate_set):]\n",
    "            all_grandchildren = []\n",
    "            for c in remaining_children:\n",
    "                grandchildren = list(G.successors(c[0]))\n",
    "                all_grandchildren.extend([(c[0], gc) for gc in grandchildren])\n",
    "\n",
    "            if all_grandchildren:\n",
    "                grand_child_vecs = []\n",
    "                for (parent, gc) in all_grandchildren:\n",
    "                    v = embeddings.vectors[gc]\n",
    "                    vt = torch.as_tensor(v, dtype=torch.float64, device=device)\n",
    "                    grand_child_vecs.append(vt)\n",
    "                if grand_child_vecs:\n",
    "                    grand_child_mat = torch.stack(grand_child_vecs, dim=0)\n",
    "                    grand_child_sims = (grand_child_mat @ query_vec).cpu().numpy()\n",
    "                else:\n",
    "                    grand_child_sims = np.array([])\n",
    "\n",
    "                sorted_gc = sorted(zip(all_grandchildren, grand_child_sims), key=lambda x: x[1], reverse=True)\n",
    "                max_gc = float(np.max(grand_child_sims)) if len(grand_child_sims) > 0 else 0.0\n",
    "                sorted_gc_relevant = [c for c in sorted_gc if c[1] > sim_threshold * max_gc]\n",
    "                sorted_gc_proba = [c for c in sorted_gc if c[1] * G.edges[c[0][0], c[0][1]].get(\"prob\", 0.1) > sim_threshold * max_gc]\n",
    "\n",
    "                edge_to_consider: Dict[Tuple[str, str], float] = {}\n",
    "                for child in [gc[0][1] for gc in sorted_gc_relevant + sorted_gc_proba]:\n",
    "                    sim = float((torch.as_tensor(embeddings.vectors[child], dtype=torch.float64, device=device) @ query_vec).item())\n",
    "                    sim_transformed = float(np.exp(sim) / np.exp(1))\n",
    "                    if not G.has_edge(new_node_id, child):\n",
    "                        G.add_edge(new_node_id, child,\n",
    "                                   prob=initial_prob_new,\n",
    "                                   structure_distance=1.0 / (sim_transformed + 1e-6))\n",
    "                    edge_to_consider[(new_node_id, child)] = sim_transformed\n",
    "\n",
    "                rewarded_edges = reward_distribution(edge_to_consider, reward=5.0, lr=lr)\n",
    "                if rewarded_edges:\n",
    "                    for (u, v), change_prob in rewarded_edges.items():\n",
    "                        current_prob = G.edges[u, v].get(\"prob\", initial_prob_new)\n",
    "                        G.edges[u, v][\"prob\"] = min(current_prob + change_prob, 1.0)\n",
    "                        _log_if_enabled(f\"Updated edge {u}->{v} probability by {change_prob:.3f}\", enable_logging)\n",
    "\n",
    "            current = new_node_id\n",
    "            path.append(TraversalStep(node_id=current, similarity=float(np.mean(candidate_vecs)) if candidate_vecs else None))\n",
    "\n",
    "        else:\n",
    "            # No fusion → follow best child\n",
    "            best_idx = int(np.argmax(sims_np))\n",
    "            current = children[best_idx]\n",
    "            path.append(TraversalStep(node_id=current, similarity=float(sims_np[best_idx])))\n",
    "\n",
    "    _clean_graph_dtypes(G)\n",
    "    _log_if_enabled(f\"Total wasted time in calculations: {temps_wasted:.3f} seconds\", enable_logging)\n",
    "    return path\n",
    "\n",
    "\n",
    "# Convenience class kept for parity\n",
    "class FGWTraversal:\n",
    "    def __init__(self, config: FGWConfig):\n",
    "        self.config = config\n",
    "\n",
    "    def genetic_traversal(self, start_node: str, question: str, embeddings: EmbeddingStore,\n",
    "                          G: nx.DiGraph, model: SentenceTransformer) -> List[TraversalStep]:\n",
    "        return recursive_traversal_with_score_fusion_fgw_genetic_optimized(\n",
    "            start_node, question, embeddings, G, model,\n",
    "            max_depth=self.config.max_depth, sim_threshold=self.config.sim_threshold,\n",
    "            fgw_threshold=self.config.fgw_threshold, alpha=self.config.alpha,\n",
    "            initial_prob=self.config.initial_prob, initial_prob_new=self.config.initial_prob_new,\n",
    "            lr=self.config.lr, structure_distance=self.config.structure_distance,\n",
    "            compact_fusion=self.config.compact_fusion, enable_logging=self.config.enable_logging\n",
    "        )\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cef9bbb4-ebb9-4e4e-8634-954051eb8827",
   "metadata": {},
   "outputs": [],
   "source": [
    "client = OpenAI(base_url=\"http://localhost:11434/v1\", api_key=\"ollama\")\n",
    "\n",
    "def ask_llm_strict(prompt, client):\n",
    "    response = client.chat.completions.create(\n",
    "        model=\"llama3\",\n",
    "        messages=[\n",
    "    {\"role\": \"system\", \"content\": \"You are a strict answer extractor. Only return the shortest possible answer.\"},\n",
    "    {\"role\": \"user\", \"content\": prompt},\n",
    "        ],\n",
    "        temperature=0.1,\n",
    "    )\n",
    "    return response.choices[0].message.content\n",
    "\n",
    "\n",
    "\n",
    "def build_EM_prompt_longbench(question, context, choices):\n",
    "    \"\"\"\n",
    "    Builds a prompt for LongBench-v2 multiple choice questions.\n",
    "    \"\"\"\n",
    "    choices_text = \"\"\n",
    "    for letter, choice in choices.items():\n",
    "        if choice.strip():  # Only if the choice is not empty\n",
    "            choices_text += f\"{letter}. {choice}\\n\"\n",
    "    \n",
    "    return f\"\"\"You are an extraction model specialized in multiple choice questions.\n",
    "\n",
    "You will be given a question, multiple choice options, and a context. Your task is to select the correct answer from the given choices based on the context.\n",
    "\n",
    "Instructions:\n",
    "- Read the context carefully\n",
    "- Analyze the question and all available choices\n",
    "- Select the letter (A, B, C, or D) that corresponds to the best answer\n",
    "- Return ONLY the letter of your chosen answer (A, B, C, or D)\n",
    "- Do not provide explanations or additional text\n",
    "\n",
    "---\n",
    "\n",
    "Context:\n",
    "{context}\n",
    "\n",
    "---\n",
    "\n",
    "Question: {question}\n",
    "\n",
    "Choices:\n",
    "{choices_text}\n",
    "\n",
    "Answer:\"\"\"\n",
    "\n",
    "\n",
    "def ask_llm_multiple_choice(prompt, client):\n",
    "    \"\"\"\n",
    "    Specialized version for multiple choice questions.\n",
    "    \"\"\"\n",
    "    response = client.chat.completions.create(\n",
    "        model=\"llama3\",\n",
    "        messages=[\n",
    "            {\"role\": \"system\", \"content\": \"You are a multiple choice question answering system. Only return the letter of the correct answer (A, B, C, or D).\"},\n",
    "            {\"role\": \"user\", \"content\": prompt},\n",
    "        ],\n",
    "        temperature=0.1,\n",
    "    )\n",
    "    # Clean the response to keep only the letter\n",
    "    answer = response.choices[0].message.content.strip().upper()\n",
    "    # Take only the first character if there's additional text\n",
    "    if answer and answer[0] in ['A', 'B', 'C', 'D']:\n",
    "        return answer[0]\n",
    "    return answer"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "51d6523e-f3ca-4c1a-b008-c7cdf839c254",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'\\n# 1. Génération et sauvegarde (à faire une seule fois)\\ndf = pd.read_json(\"hf://datasets/zai-org/LongBench-v2/data.json\")\\ngraphs, questions, choices, answers = generate_graphs_from_longbench_df(df, max_items=100)\\n\\n# 2. Chargement des données sauvegardées (pour les utilisations suivantes)\\ngraphs, questions, choices, answers = load_longbench_data()\\n\\n# 3. Affichage des statistiques\\nget_longbench_stats(graphs, questions, choices, answers)\\n'"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def load_longbench_data(output_dir=\"/workspace/longbench-data\"):\n",
    "    \"\"\"\n",
    "    Loads pre-processed LongBench-v2 data from files.\n",
    "    \n",
    "    Args:\n",
    "        output_dir: directory containing the saved files\n",
    "    \n",
    "    Returns:\n",
    "        tuple: (graphs_by_id, questions_by_id, choices_by_id, answers_by_id)\n",
    "    \"\"\"\n",
    "    import pickle\n",
    "    import json\n",
    "    import os\n",
    "    \n",
    "    # Input files\n",
    "    graphs_file = os.path.join(output_dir, \"longbench_graphs.pkl\")\n",
    "    questions_file = os.path.join(output_dir, \"longbench_questions.json\")\n",
    "    choices_file = os.path.join(output_dir, \"longbench_choices.json\")\n",
    "    answers_file = os.path.join(output_dir, \"longbench_answers.json\")\n",
    "    \n",
    "    # Check that all files exist\n",
    "    required_files = [graphs_file, questions_file, choices_file, answers_file]\n",
    "    missing_files = [f for f in required_files if not os.path.exists(f)]\n",
    "    \n",
    "    if missing_files:\n",
    "        print(f\"Missing files: {missing_files}\")\n",
    "        print(\"Please first run generate_graphs_from_longbench_df() to create the files.\")\n",
    "        return None, None, None, None\n",
    "    \n",
    "    try:\n",
    "        print(\"Loading LongBench-v2 data...\")\n",
    "        \n",
    "        # Load graphs\n",
    "        print(\"- Loading graphs...\")\n",
    "        with open(graphs_file, 'rb') as f:\n",
    "            graphs_by_id = pickle.load(f)\n",
    "        \n",
    "        # Load metadata\n",
    "        print(\"- Loading questions...\")\n",
    "        with open(questions_file, 'r') as f:\n",
    "            questions_by_id = json.load(f)\n",
    "        \n",
    "        print(\"- Loading choices...\")\n",
    "        with open(choices_file, 'r') as f:\n",
    "            choices_by_id = json.load(f)\n",
    "        \n",
    "        print(\"- Loading answers...\")\n",
    "        with open(answers_file, 'r') as f:\n",
    "            answers_by_id = json.load(f)\n",
    "        \n",
    "        print(f\"✓ Data loaded successfully:\")\n",
    "        print(f\"  - {len(graphs_by_id)} graphs\")\n",
    "        print(f\"  - {len(questions_by_id)} questions\")\n",
    "        print(f\"  - {len(choices_by_id)} choice sets\")\n",
    "        print(f\"  - {len(answers_by_id)} answers\")\n",
    "\n",
    "        return graphs_by_id, questions_by_id, choices_by_id, answers_by_id\n",
    "        \n",
    "    except Exception as e:\n",
    "        print(f\"Error during loading: {e}\")\n",
    "        return None, None, None, None\n",
    "\n",
    "\n",
    "def get_longbench_stats(graphs_by_id, questions_by_id, choices_by_id, answers_by_id):\n",
    "    \"\"\"\n",
    "    Displays statistics about the loaded LongBench-v2 data.\n",
    "    \"\"\"\n",
    "    if not graphs_by_id:\n",
    "        print(\"No data to analyze.\")\n",
    "        return"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "04e97d85-ed0f-41c7-bfc2-3669600bf1d6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Dataset loaded with 503 samples\n",
      "Columns: ['_id', 'domain', 'sub_domain', 'difficulty', 'length', 'question', 'choice_A', 'choice_B', 'choice_C', 'choice_D', 'answer', 'context']\n",
      "Sample domains: domain\n",
      "Single-Document QA                     175\n",
      "Multi-Document QA                      125\n",
      "Long In-context Learning                81\n",
      "Code Repository Understanding           50\n",
      "Long-dialogue History Understanding     39\n",
      "Name: count, dtype: int64\n",
      "Chargement des données LongBench-v2...\n",
      "- Chargement des graphes...\n",
      "- Chargement des questions...\n",
      "- Chargement des choix...\n",
      "- Chargement des réponses...\n",
      "✓ Données chargées avec succès!\n",
      "  - 100 graphes\n",
      "  - 100 questions\n",
      "  - 100 ensembles de choix\n",
      "  - 100 réponses\n",
      "qid: 66f36490821e116aacb2cc22\n",
      "🚀 Using device: cuda\n",
      "[INFO] Starting depth 0 with node document\n",
      "[INFO] Relevant children: ['section_89: 0.627', 'section_90: 0.551', 'section_92: 0.527', 'section_15: 0.521', 'section_21: 0.504', 'section_14: 0.495', 'section_20: 0.494', 'section_91: 0.491', 'section_11: 0.489', 'section_13: 0.489', 'section_0: 0.488', 'section_52: 0.487', 'section_1: 0.486', 'section_34: 0.479', 'section_7: 0.478', 'section_41: 0.478', 'section_36: 0.476', 'section_49: 0.474', 'section_79: 0.474', 'section_39: 0.474', 'section_12: 0.468', 'section_60: 0.467', 'section_94: 0.467', 'section_61: 0.467', 'section_43: 0.466', 'section_5: 0.465', 'section_80: 0.464', 'section_51: 0.461', 'section_47: 0.461', 'section_53: 0.461', 'section_66: 0.457', 'section_93: 0.455', 'section_45: 0.454', 'section_35: 0.451', 'section_48: 0.450', 'section_72: 0.450', 'section_59: 0.448', 'section_24: 0.447', 'section_95: 0.445', 'section_82: 0.443', 'section_8: 0.442', 'section_77: 0.442', 'section_22: 0.441', 'section_85: 0.440', 'section_42: 0.440']\n",
      "[INFO] Probability children: ['section_89: 0.627', 'section_90: 0.551', 'section_92: 0.527', 'section_15: 0.521', 'section_21: 0.504', 'section_14: 0.495', 'section_20: 0.494', 'section_91: 0.491', 'section_11: 0.489', 'section_13: 0.489', 'section_0: 0.488', 'section_52: 0.487', 'section_1: 0.486', 'section_34: 0.479', 'section_7: 0.478', 'section_41: 0.478', 'section_36: 0.476', 'section_49: 0.474', 'section_79: 0.474', 'section_39: 0.474', 'section_12: 0.468', 'section_60: 0.467', 'section_94: 0.467', 'section_61: 0.467', 'section_43: 0.466', 'section_5: 0.465', 'section_80: 0.464', 'section_51: 0.461', 'section_47: 0.461', 'section_53: 0.461', 'section_66: 0.457', 'section_93: 0.455', 'section_45: 0.454', 'section_35: 0.451', 'section_48: 0.450', 'section_72: 0.450', 'section_59: 0.448', 'section_24: 0.447', 'section_95: 0.445', 'section_82: 0.443', 'section_8: 0.442', 'section_77: 0.442', 'section_22: 0.441', 'section_85: 0.440', 'section_42: 0.440']\n",
      "[INFO] Preprocessing time: 1.012 seconds\n",
      "[INFO] Time for the fgw computation : 0.9344 seconds\n",
      "[DEBUG] mid=23, fgw_dist=0.0261, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.9633 seconds\n",
      "[DEBUG] mid=34, fgw_dist=0.0318, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.9335 seconds\n",
      "[DEBUG] mid=40, fgw_dist=0.0346, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.9321 seconds\n",
      "[DEBUG] mid=43, fgw_dist=0.0361, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.9522 seconds\n",
      "[DEBUG] mid=44, fgw_dist=0.0367, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.9309 seconds\n",
      "[DEBUG] mid=45, fgw_dist=0.0373, distance_restante=1.3000\n",
      "[INFO] Optimal set containing: ['section_89', 'section_90', 'section_92', 'section_15', 'section_21', 'section_14', 'section_20', 'section_91', 'section_11', 'section_13', 'section_0', 'section_52', 'section_1', 'section_34', 'section_7', 'section_41', 'section_36', 'section_49', 'section_79', 'section_39', 'section_12', 'section_60', 'section_94', 'section_61', 'section_43', 'section_5', 'section_80', 'section_51', 'section_47', 'section_53', 'section_66', 'section_93', 'section_45', 'section_35', 'section_48', 'section_72', 'section_59', 'section_24', 'section_95', 'section_82', 'section_8', 'section_77', 'section_22', 'section_85', 'section_42'] (FGW<=budget)\n",
      "[INFO] Total candidate set: [('section_89', np.float64(0.6267496550617933)), ('section_90', np.float64(0.551067514688607)), ('section_92', np.float64(0.527393473582852)), ('section_15', np.float64(0.5209869966150691)), ('section_21', np.float64(0.5042426662610824)), ('section_14', np.float64(0.49480933828350376)), ('section_20', np.float64(0.49405740183215086)), ('section_91', np.float64(0.49129264438826414)), ('section_11', np.float64(0.4891024195083264)), ('section_13', np.float64(0.48869800519600526)), ('section_0', np.float64(0.48838352858832956)), ('section_52', np.float64(0.4868527457432956)), ('section_1', np.float64(0.48573370594021126)), ('section_34', np.float64(0.4790674052886398)), ('section_7', np.float64(0.47841185917956336)), ('section_41', np.float64(0.4779669180121834)), ('section_36', np.float64(0.4759443023091984)), ('section_49', np.float64(0.4741211078433121)), ('section_79', np.float64(0.4740735385646635)), ('section_39', np.float64(0.4737202507195505)), ('section_12', np.float64(0.46816889186897526)), ('section_60', np.float64(0.4671592963791612)), ('section_94', np.float64(0.4670540108664893)), ('section_61', np.float64(0.46697365925965356)), ('section_43', np.float64(0.4663953429511987)), ('section_5', np.float64(0.4650753013488992)), ('section_80', np.float64(0.46393180862676453)), ('section_51', np.float64(0.461294276758036)), ('section_47', np.float64(0.46079962133828317)), ('section_53', np.float64(0.460748442435175)), ('section_66', np.float64(0.45711004360040286)), ('section_93', np.float64(0.4551322560303373)), ('section_45', np.float64(0.45379907286991705)), ('section_35', np.float64(0.4514573958886736)), ('section_48', np.float64(0.4500677225675518)), ('section_72', np.float64(0.449667513368372)), ('section_59', np.float64(0.448171275412217)), ('section_24', np.float64(0.44684747623397514)), ('section_95', np.float64(0.444823810195241)), ('section_82', np.float64(0.44262329479058166)), ('section_8', np.float64(0.44219053435991706)), ('section_77', np.float64(0.4415713859805333)), ('section_22', np.float64(0.440843443893062)), ('section_85', np.float64(0.4402176617313658)), ('section_42', np.float64(0.4398808569314656))]\n",
      "[INFO] Removed edge document -> section_89 and node section_89\n",
      "[INFO] Removed edge document -> section_90 and node section_90\n",
      "[INFO] Removed edge document -> section_92 and node section_92\n",
      "[INFO] Removed edge document -> section_15 and node section_15\n",
      "[INFO] Removed edge document -> section_21 and node section_21\n",
      "[INFO] Removed edge document -> section_14 and node section_14\n",
      "[INFO] Removed edge document -> section_20 and node section_20\n",
      "[INFO] Removed edge document -> section_91 and node section_91\n",
      "[INFO] Removed edge document -> section_11 and node section_11\n",
      "[INFO] Removed edge document -> section_13 and node section_13\n",
      "[INFO] Removed edge document -> section_0 and node section_0\n",
      "[INFO] Removed edge document -> section_52 and node section_52\n",
      "[INFO] Removed edge document -> section_1 and node section_1\n",
      "[INFO] Removed edge document -> section_34 and node section_34\n",
      "[INFO] Removed edge document -> section_7 and node section_7\n",
      "[INFO] Removed edge document -> section_41 and node section_41\n",
      "[INFO] Removed edge document -> section_36 and node section_36\n",
      "[INFO] Removed edge document -> section_49 and node section_49\n",
      "[INFO] Removed edge document -> section_79 and node section_79\n",
      "[INFO] Removed edge document -> section_39 and node section_39\n",
      "[INFO] Removed edge document -> section_12 and node section_12\n",
      "[INFO] Removed edge document -> section_60 and node section_60\n",
      "[INFO] Removed edge document -> section_94 and node section_94\n",
      "[INFO] Removed edge document -> section_61 and node section_61\n",
      "[INFO] Removed edge document -> section_43 and node section_43\n",
      "[INFO] Removed edge document -> section_5 and node section_5\n",
      "[INFO] Removed edge document -> section_80 and node section_80\n",
      "[INFO] Removed edge document -> section_51 and node section_51\n",
      "[INFO] Removed edge document -> section_47 and node section_47\n",
      "[INFO] Removed edge document -> section_53 and node section_53\n",
      "[INFO] Removed edge document -> section_66 and node section_66\n",
      "[INFO] Removed edge document -> section_93 and node section_93\n",
      "[INFO] Removed edge document -> section_45 and node section_45\n",
      "[INFO] Removed edge document -> section_35 and node section_35\n",
      "[INFO] Removed edge document -> section_48 and node section_48\n",
      "[INFO] Removed edge document -> section_72 and node section_72\n",
      "[INFO] Removed edge document -> section_59 and node section_59\n",
      "[INFO] Removed edge document -> section_24 and node section_24\n",
      "[INFO] Removed edge document -> section_95 and node section_95\n",
      "[INFO] Removed edge document -> section_82 and node section_82\n",
      "[INFO] Removed edge document -> section_8 and node section_8\n",
      "[INFO] Removed edge document -> section_77 and node section_77\n",
      "[INFO] Removed edge document -> section_22 and node section_22\n",
      "[INFO] Removed edge document -> section_85 and node section_85\n",
      "[INFO] Removed edge document -> section_42 and node section_42\n",
      "[INFO] Fusion time: 0.068 seconds\n",
      "[INFO] Starting depth 1 with node fused_document_0_2d17bd8a\n",
      "[INFO] Relevant children: ['section_89_para_4: 0.729', 'section_89_para_17: 0.708', 'section_53_para_24: 0.647', 'section_20_para_7: 0.638', 'section_60_para_21: 0.631', 'section_66_para_10: 0.626', 'section_89_para_15: 0.626', 'section_20_para_15: 0.622', 'section_52_para_11: 0.604', 'section_0_para_6: 0.602', 'section_89_para_19: 0.592', 'section_39_para_7: 0.591', 'section_93_para_6: 0.587', 'section_0_para_23: 0.587', 'section_47_para_7: 0.585', 'section_24_para_10: 0.585', 'section_8_para_9: 0.585', 'section_15_para_17: 0.584', 'section_5_para_15: 0.584', 'section_90_para_5: 0.582', 'section_48_para_19: 0.582', 'section_21_para_17: 0.581', 'section_52_para_12: 0.581', 'section_5_para_14: 0.579', 'section_92_para_7: 0.577', 'section_82_para_4: 0.576', 'section_13_para_26: 0.575', 'section_24_para_27: 0.574', 'section_61_para_7: 0.573', 'section_48_para_16: 0.571', 'section_13_para_4: 0.571', 'section_93_para_5: 0.570', 'section_14_para_7: 0.570', 'section_48_para_7: 0.568', 'section_60_para_8: 0.568', 'section_48_para_5: 0.566', 'section_20_para_8: 0.566', 'section_1_para_17: 0.565', 'section_52_para_13: 0.564', 'section_95_para_5: 0.563', 'section_85_para_8: 0.562', 'section_89_para_10: 0.562', 'section_39_para_13: 0.562', 'section_7_para_12: 0.561', 'section_48_para_14: 0.559', 'section_90_para_4: 0.559', 'section_90_para_27: 0.558', 'section_5_para_12: 0.557', 'section_43_para_13: 0.556', 'section_15_para_26: 0.556', 'section_89_para_11: 0.556', 'section_13_para_5: 0.555', 'section_14_para_16: 0.555', 'section_95_para_9: 0.554', 'section_89_para_5: 0.554', 'section_89_para_18: 0.554', 'section_34_para_15: 0.553', 'section_77_para_10: 0.553', 'section_94_para_21: 0.549', 'section_35_para_5: 0.548', 'section_80_para_15: 0.548', 'section_80_para_13: 0.547', 'section_20_para_10: 0.547', 'section_59_para_7: 0.545', 'section_0_para_25: 0.545', 'section_8_para_16: 0.544', 'section_89_para_9: 0.543', 'section_66_para_9: 0.543', 'section_47_para_6: 0.542', 'section_90_para_10: 0.542', 'section_8_para_11: 0.540', 'section_90_para_26: 0.540', 'section_77_para_15: 0.539', 'section_8_para_13: 0.538', 'section_24_para_17: 0.537', 'section_34_para_27: 0.536', 'section_12_para_9: 0.536', 'section_91_para_4: 0.534', 'section_5_para_10: 0.534', 'section_11_para_22: 0.534', 'section_8_para_4: 0.533', 'section_77_para_17: 0.533', 'section_59_para_8: 0.530', 'section_12_para_10: 0.530', 'section_93_para_14: 0.530', 'section_11_para_25: 0.530', 'section_92_para_15: 0.529', 'section_1_para_7: 0.529', 'section_80_para_21: 0.529', 'section_22_para_6: 0.529', 'section_90_para_9: 0.529', 'section_14_para_20: 0.528', 'section_41_para_17: 0.528', 'section_8_para_6: 0.527', 'section_21_para_24: 0.527', 'section_20_para_20: 0.527', 'section_5_para_8: 0.525', 'section_13_para_10: 0.524', 'section_92_para_13: 0.524', 'section_34_para_26: 0.524', 'section_80_para_17: 0.523', 'section_79_para_24: 0.521', 'section_82_para_8: 0.521', 'section_24_para_8: 0.521', 'section_12_para_26: 0.520', 'section_47_para_15: 0.520', 'section_77_para_6: 0.520', 'section_82_para_7: 0.519', 'section_53_para_11: 0.519', 'section_42_para_19: 0.517', 'section_79_para_9: 0.517', 'section_15_para_13: 0.517', 'section_12_para_11: 0.515', 'section_77_para_4: 0.515', 'section_61_para_6: 0.514', 'section_60_para_18: 0.513', 'section_0_para_5: 0.513', 'section_89_para_12: 0.513', 'section_21_para_14: 0.513', 'section_90_para_24: 0.513', 'section_15_para_5: 0.513', 'section_85_para_15: 0.513', 'section_90_para_17: 0.512', 'section_43_para_15: 0.511', 'section_53_para_9: 0.511', 'section_80_para_4: 0.511']\n",
      "[INFO] Probability children: ['section_89_para_4: 0.729', 'section_89_para_17: 0.708', 'section_53_para_24: 0.647', 'section_20_para_7: 0.638', 'section_60_para_21: 0.631', 'section_66_para_10: 0.626', 'section_89_para_15: 0.626', 'section_20_para_15: 0.622', 'section_52_para_11: 0.604', 'section_0_para_6: 0.602', 'section_89_para_19: 0.592', 'section_39_para_7: 0.591', 'section_93_para_6: 0.587', 'section_0_para_23: 0.587', 'section_47_para_7: 0.585', 'section_24_para_10: 0.585', 'section_8_para_9: 0.585', 'section_15_para_17: 0.584', 'section_5_para_15: 0.584', 'section_90_para_5: 0.582', 'section_48_para_19: 0.582', 'section_21_para_17: 0.581', 'section_52_para_12: 0.581', 'section_5_para_14: 0.579', 'section_92_para_7: 0.577', 'section_82_para_4: 0.576', 'section_13_para_26: 0.575', 'section_24_para_27: 0.574', 'section_61_para_7: 0.573', 'section_48_para_16: 0.571', 'section_13_para_4: 0.571', 'section_93_para_5: 0.570', 'section_14_para_7: 0.570', 'section_48_para_7: 0.568', 'section_60_para_8: 0.568', 'section_48_para_5: 0.566', 'section_20_para_8: 0.566', 'section_1_para_17: 0.565', 'section_52_para_13: 0.564', 'section_95_para_5: 0.563', 'section_85_para_8: 0.562', 'section_89_para_10: 0.562', 'section_39_para_13: 0.562', 'section_7_para_12: 0.561', 'section_48_para_14: 0.559', 'section_90_para_4: 0.559', 'section_90_para_27: 0.558', 'section_5_para_12: 0.557', 'section_43_para_13: 0.556', 'section_15_para_26: 0.556', 'section_89_para_11: 0.556', 'section_13_para_5: 0.555', 'section_14_para_16: 0.555', 'section_95_para_9: 0.554', 'section_89_para_5: 0.554', 'section_89_para_18: 0.554', 'section_34_para_15: 0.553', 'section_77_para_10: 0.553', 'section_94_para_21: 0.549', 'section_35_para_5: 0.548', 'section_80_para_15: 0.548', 'section_80_para_13: 0.547', 'section_20_para_10: 0.547', 'section_59_para_7: 0.545', 'section_0_para_25: 0.545', 'section_8_para_16: 0.544', 'section_89_para_9: 0.543', 'section_66_para_9: 0.543', 'section_47_para_6: 0.542', 'section_90_para_10: 0.542', 'section_8_para_11: 0.540', 'section_90_para_26: 0.540', 'section_77_para_15: 0.539', 'section_8_para_13: 0.538', 'section_24_para_17: 0.537', 'section_34_para_27: 0.536', 'section_12_para_9: 0.536', 'section_91_para_4: 0.534', 'section_5_para_10: 0.534', 'section_11_para_22: 0.534', 'section_8_para_4: 0.533', 'section_77_para_17: 0.533', 'section_59_para_8: 0.530', 'section_12_para_10: 0.530', 'section_93_para_14: 0.530', 'section_11_para_25: 0.530', 'section_92_para_15: 0.529', 'section_1_para_7: 0.529', 'section_80_para_21: 0.529', 'section_22_para_6: 0.529', 'section_90_para_9: 0.529', 'section_14_para_20: 0.528', 'section_41_para_17: 0.528', 'section_8_para_6: 0.527', 'section_21_para_24: 0.527', 'section_20_para_20: 0.527', 'section_5_para_8: 0.525', 'section_13_para_10: 0.524', 'section_92_para_13: 0.524', 'section_34_para_26: 0.524', 'section_80_para_17: 0.523', 'section_79_para_24: 0.521', 'section_82_para_8: 0.521', 'section_24_para_8: 0.521', 'section_12_para_26: 0.520', 'section_47_para_15: 0.520', 'section_77_para_6: 0.520', 'section_82_para_7: 0.519', 'section_53_para_11: 0.519', 'section_42_para_19: 0.517', 'section_79_para_9: 0.517', 'section_15_para_13: 0.517', 'section_12_para_11: 0.515', 'section_77_para_4: 0.515', 'section_61_para_6: 0.514', 'section_60_para_18: 0.513', 'section_0_para_5: 0.513', 'section_89_para_12: 0.513', 'section_21_para_14: 0.513', 'section_90_para_24: 0.513', 'section_15_para_5: 0.513', 'section_85_para_15: 0.513', 'section_90_para_17: 0.512', 'section_43_para_15: 0.511', 'section_53_para_9: 0.511', 'section_80_para_4: 0.511']\n",
      "[INFO] Preprocessing time: 7.757 seconds\n",
      "[INFO] Time for the fgw computation : 0.1327 seconds\n",
      "[DEBUG] mid=63, fgw_dist=0.3729, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1586 seconds\n",
      "[DEBUG] mid=95, fgw_dist=0.3737, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1690 seconds\n",
      "[DEBUG] mid=111, fgw_dist=0.3742, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1076 seconds\n",
      "[DEBUG] mid=119, fgw_dist=0.3744, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1605 seconds\n",
      "[DEBUG] mid=123, fgw_dist=0.3745, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1070 seconds\n",
      "[DEBUG] mid=125, fgw_dist=0.3746, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 0.1595 seconds\n",
      "[DEBUG] mid=126, fgw_dist=0.3746, distance_restante=1.3000\n",
      "[INFO] Optimal set containing: ['section_89_para_4', 'section_89_para_17', 'section_53_para_24', 'section_20_para_7', 'section_60_para_21', 'section_66_para_10', 'section_89_para_15', 'section_20_para_15', 'section_52_para_11', 'section_0_para_6', 'section_89_para_19', 'section_39_para_7', 'section_93_para_6', 'section_0_para_23', 'section_47_para_7', 'section_24_para_10', 'section_8_para_9', 'section_15_para_17', 'section_5_para_15', 'section_90_para_5', 'section_48_para_19', 'section_21_para_17', 'section_52_para_12', 'section_5_para_14', 'section_92_para_7', 'section_82_para_4', 'section_13_para_26', 'section_24_para_27', 'section_61_para_7', 'section_48_para_16', 'section_13_para_4', 'section_93_para_5', 'section_14_para_7', 'section_48_para_7', 'section_60_para_8', 'section_48_para_5', 'section_20_para_8', 'section_1_para_17', 'section_52_para_13', 'section_95_para_5', 'section_85_para_8', 'section_89_para_10', 'section_39_para_13', 'section_7_para_12', 'section_48_para_14', 'section_90_para_4', 'section_90_para_27', 'section_5_para_12', 'section_43_para_13', 'section_15_para_26', 'section_89_para_11', 'section_13_para_5', 'section_14_para_16', 'section_95_para_9', 'section_89_para_5', 'section_89_para_18', 'section_34_para_15', 'section_77_para_10', 'section_94_para_21', 'section_35_para_5', 'section_80_para_15', 'section_80_para_13', 'section_20_para_10', 'section_59_para_7', 'section_0_para_25', 'section_8_para_16', 'section_89_para_9', 'section_66_para_9', 'section_47_para_6', 'section_90_para_10', 'section_8_para_11', 'section_90_para_26', 'section_77_para_15', 'section_8_para_13', 'section_24_para_17', 'section_34_para_27', 'section_12_para_9', 'section_91_para_4', 'section_5_para_10', 'section_11_para_22', 'section_8_para_4', 'section_77_para_17', 'section_59_para_8', 'section_12_para_10', 'section_93_para_14', 'section_11_para_25', 'section_92_para_15', 'section_1_para_7', 'section_80_para_21', 'section_22_para_6', 'section_90_para_9', 'section_14_para_20', 'section_41_para_17', 'section_8_para_6', 'section_21_para_24', 'section_20_para_20', 'section_5_para_8', 'section_13_para_10', 'section_92_para_13', 'section_34_para_26', 'section_80_para_17', 'section_79_para_24', 'section_82_para_8', 'section_24_para_8', 'section_12_para_26', 'section_47_para_15', 'section_77_para_6', 'section_82_para_7', 'section_53_para_11', 'section_42_para_19', 'section_79_para_9', 'section_15_para_13', 'section_12_para_11', 'section_77_para_4', 'section_61_para_6', 'section_60_para_18', 'section_0_para_5', 'section_89_para_12', 'section_21_para_14', 'section_90_para_24', 'section_15_para_5', 'section_85_para_15', 'section_90_para_17', 'section_43_para_15', 'section_53_para_9', 'section_80_para_4'] (FGW<=budget)\n",
      "[INFO] Total candidate set: [('section_89_para_4', np.float64(0.7290482646294127)), ('section_89_para_17', np.float64(0.7078441411396468)), ('section_53_para_24', np.float64(0.6472182666249885)), ('section_20_para_7', np.float64(0.6380584127118195)), ('section_60_para_21', np.float64(0.631041778137361)), ('section_66_para_10', np.float64(0.6262748415766486)), ('section_89_para_15', np.float64(0.6257371156837012)), ('section_20_para_15', np.float64(0.6217070505603016)), ('section_52_para_11', np.float64(0.6035887545398257)), ('section_0_para_6', np.float64(0.6024905690831917)), ('section_89_para_19', np.float64(0.592427529331644)), ('section_39_para_7', np.float64(0.5906881279418461)), ('section_93_para_6', np.float64(0.5868565977351723)), ('section_0_para_23', np.float64(0.5867912823253127)), ('section_47_para_7', np.float64(0.5853210074722147)), ('section_24_para_10', np.float64(0.5849105460999563)), ('section_8_para_9', np.float64(0.5845181760936324)), ('section_15_para_17', np.float64(0.5841343387695779)), ('section_5_para_15', np.float64(0.5837699940476109)), ('section_90_para_5', np.float64(0.5819664141290597)), ('section_48_para_19', np.float64(0.5816252761457392)), ('section_21_para_17', np.float64(0.5814332941222009)), ('section_52_para_12', np.float64(0.5809319144230378)), ('section_5_para_14', np.float64(0.579051238796177)), ('section_92_para_7', np.float64(0.576649229920761)), ('section_82_para_4', np.float64(0.5762085925487357)), ('section_13_para_26', np.float64(0.574632800254603)), ('section_24_para_27', np.float64(0.5739036291644547)), ('section_61_para_7', np.float64(0.5729569958607869)), ('section_48_para_16', np.float64(0.5714645964143639)), ('section_13_para_4', np.float64(0.5713685440940912)), ('section_93_para_5', np.float64(0.5703551587230207)), ('section_14_para_7', np.float64(0.5699686943918854)), ('section_48_para_7', np.float64(0.567949074229991)), ('section_60_para_8', np.float64(0.5677320225494782)), ('section_48_para_5', np.float64(0.566113769319849)), ('section_20_para_8', np.float64(0.5656171811118491)), ('section_1_para_17', np.float64(0.5651184609303151)), ('section_52_para_13', np.float64(0.5635881787401756)), ('section_95_para_5', np.float64(0.5627518044714759)), ('section_85_para_8', np.float64(0.5619901400826459)), ('section_89_para_10', np.float64(0.5616731615857504)), ('section_39_para_13', np.float64(0.5616614615786812)), ('section_7_para_12', np.float64(0.5612676733513167)), ('section_48_para_14', np.float64(0.559449937702573)), ('section_90_para_4', np.float64(0.5587435813167808)), ('section_90_para_27', np.float64(0.5575426798193056)), ('section_5_para_12', np.float64(0.5572811927016191)), ('section_43_para_13', np.float64(0.5564120607485568)), ('section_15_para_26', np.float64(0.5561580279715006)), ('section_89_para_11', np.float64(0.5557232887801133)), ('section_13_para_5', np.float64(0.5546537869844467)), ('section_14_para_16', np.float64(0.5545662444585682)), ('section_95_para_9', np.float64(0.5544243091430345)), ('section_89_para_5', np.float64(0.55438075925351)), ('section_89_para_18', np.float64(0.5539464274663826)), ('section_34_para_15', np.float64(0.5530646590243747)), ('section_77_para_10', np.float64(0.5527621840399782)), ('section_94_para_21', np.float64(0.5488765635328765)), ('section_35_para_5', np.float64(0.5480233511185907)), ('section_80_para_15', np.float64(0.5480221276000162)), ('section_80_para_13', np.float64(0.5471352440950668)), ('section_20_para_10', np.float64(0.5468662001094855)), ('section_59_para_7', np.float64(0.5448407103268569)), ('section_0_para_25', np.float64(0.544768867340156)), ('section_8_para_16', np.float64(0.5436125032495932)), ('section_89_para_9', np.float64(0.5430544741106219)), ('section_66_para_9', np.float64(0.542921662530614)), ('section_47_para_6', np.float64(0.5421958411888893)), ('section_90_para_10', np.float64(0.5416564471233076)), ('section_8_para_11', np.float64(0.540064070934095)), ('section_90_para_26', np.float64(0.5396124253245518)), ('section_77_para_15', np.float64(0.538914056938401)), ('section_8_para_13', np.float64(0.5375523982304438)), ('section_24_para_17', np.float64(0.5371007445245866)), ('section_34_para_27', np.float64(0.5357710942530163)), ('section_12_para_9', np.float64(0.5357281632043059)), ('section_91_para_4', np.float64(0.5339568400886666)), ('section_5_para_10', np.float64(0.533750063686873)), ('section_11_para_22', np.float64(0.5336915412602953)), ('section_8_para_4', np.float64(0.5329010546378592)), ('section_77_para_17', np.float64(0.5328143508643818)), ('section_59_para_8', np.float64(0.5302329225804379)), ('section_12_para_10', np.float64(0.5300116660611243)), ('section_93_para_14', np.float64(0.5299944064190354)), ('section_11_para_25', np.float64(0.5299515394203105)), ('section_92_para_15', np.float64(0.5294380238904216)), ('section_1_para_7', np.float64(0.5293221699786466)), ('section_80_para_21', np.float64(0.5292997489870799)), ('section_22_para_6', np.float64(0.5287619186309529)), ('section_90_para_9', np.float64(0.5285119930666592)), ('section_14_para_20', np.float64(0.5282423280058115)), ('section_41_para_17', np.float64(0.5278595197168714)), ('section_8_para_6', np.float64(0.5272238704177747)), ('section_21_para_24', np.float64(0.5271033489440705)), ('section_20_para_20', np.float64(0.5270707687669743)), ('section_5_para_8', np.float64(0.5252355536057369)), ('section_13_para_10', np.float64(0.5239204409343825)), ('section_92_para_13', np.float64(0.5238412002383552)), ('section_34_para_26', np.float64(0.5236008438957727)), ('section_80_para_17', np.float64(0.5234499051649)), ('section_79_para_24', np.float64(0.5210324141452852)), ('section_82_para_8', np.float64(0.5206044203321577)), ('section_24_para_8', np.float64(0.5205559480699031)), ('section_12_para_26', np.float64(0.5202038327124912)), ('section_47_para_15', np.float64(0.5200548399855331)), ('section_77_para_6', np.float64(0.5196406207168869)), ('section_82_para_7', np.float64(0.5190511357256234)), ('section_53_para_11', np.float64(0.5187381823531665)), ('section_42_para_19', np.float64(0.5172855073816769)), ('section_79_para_9', np.float64(0.5171762548073869)), ('section_15_para_13', np.float64(0.5170001948945931)), ('section_12_para_11', np.float64(0.5150540505082015)), ('section_77_para_4', np.float64(0.514602782440983)), ('section_61_para_6', np.float64(0.5137884352976573)), ('section_60_para_18', np.float64(0.513420286865271)), ('section_0_para_5', np.float64(0.5133836513528732)), ('section_89_para_12', np.float64(0.5132347466892375)), ('section_21_para_14', np.float64(0.5132173183488801)), ('section_90_para_24', np.float64(0.5131760540774735)), ('section_15_para_5', np.float64(0.5130546905475911)), ('section_85_para_15', np.float64(0.5129879570487663)), ('section_90_para_17', np.float64(0.5123306981410314)), ('section_43_para_15', np.float64(0.5114756697306908)), ('section_53_para_9', np.float64(0.5111979497618899)), ('section_80_para_4', np.float64(0.5106285869741215))]\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_4 and node section_89_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_17 and node section_89_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_53_para_24 and node section_53_para_24\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_20_para_7 and node section_20_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_60_para_21 and node section_60_para_21\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_66_para_10 and node section_66_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_15 and node section_89_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_20_para_15 and node section_20_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_52_para_11 and node section_52_para_11\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_0_para_6 and node section_0_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_19 and node section_89_para_19\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_39_para_7 and node section_39_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_93_para_6 and node section_93_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_0_para_23 and node section_0_para_23\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_47_para_7 and node section_47_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_24_para_10 and node section_24_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_9 and node section_8_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_15_para_17 and node section_15_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_5_para_15 and node section_5_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_5 and node section_90_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_48_para_19 and node section_48_para_19\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_21_para_17 and node section_21_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_52_para_12 and node section_52_para_12\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_5_para_14 and node section_5_para_14\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_92_para_7 and node section_92_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_82_para_4 and node section_82_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_13_para_26 and node section_13_para_26\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_24_para_27 and node section_24_para_27\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_61_para_7 and node section_61_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_48_para_16 and node section_48_para_16\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_13_para_4 and node section_13_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_93_para_5 and node section_93_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_14_para_7 and node section_14_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_48_para_7 and node section_48_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_60_para_8 and node section_60_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_48_para_5 and node section_48_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_20_para_8 and node section_20_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_1_para_17 and node section_1_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_52_para_13 and node section_52_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_95_para_5 and node section_95_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_85_para_8 and node section_85_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_10 and node section_89_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_39_para_13 and node section_39_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_7_para_12 and node section_7_para_12\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_48_para_14 and node section_48_para_14\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_4 and node section_90_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_27 and node section_90_para_27\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_5_para_12 and node section_5_para_12\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_43_para_13 and node section_43_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_15_para_26 and node section_15_para_26\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_11 and node section_89_para_11\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_13_para_5 and node section_13_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_14_para_16 and node section_14_para_16\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_95_para_9 and node section_95_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_5 and node section_89_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_18 and node section_89_para_18\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_34_para_15 and node section_34_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_77_para_10 and node section_77_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_94_para_21 and node section_94_para_21\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_35_para_5 and node section_35_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_80_para_15 and node section_80_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_80_para_13 and node section_80_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_20_para_10 and node section_20_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_59_para_7 and node section_59_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_0_para_25 and node section_0_para_25\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_16 and node section_8_para_16\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_9 and node section_89_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_66_para_9 and node section_66_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_47_para_6 and node section_47_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_10 and node section_90_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_11 and node section_8_para_11\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_26 and node section_90_para_26\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_77_para_15 and node section_77_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_13 and node section_8_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_24_para_17 and node section_24_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_34_para_27 and node section_34_para_27\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_12_para_9 and node section_12_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_91_para_4 and node section_91_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_5_para_10 and node section_5_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_11_para_22 and node section_11_para_22\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_4 and node section_8_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_77_para_17 and node section_77_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_59_para_8 and node section_59_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_12_para_10 and node section_12_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_93_para_14 and node section_93_para_14\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_11_para_25 and node section_11_para_25\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_92_para_15 and node section_92_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_1_para_7 and node section_1_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_80_para_21 and node section_80_para_21\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_22_para_6 and node section_22_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_9 and node section_90_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_14_para_20 and node section_14_para_20\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_41_para_17 and node section_41_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_8_para_6 and node section_8_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_21_para_24 and node section_21_para_24\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_20_para_20 and node section_20_para_20\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_5_para_8 and node section_5_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_13_para_10 and node section_13_para_10\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_92_para_13 and node section_92_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_34_para_26 and node section_34_para_26\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_80_para_17 and node section_80_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_79_para_24 and node section_79_para_24\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_82_para_8 and node section_82_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_24_para_8 and node section_24_para_8\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_12_para_26 and node section_12_para_26\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_47_para_15 and node section_47_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_77_para_6 and node section_77_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_82_para_7 and node section_82_para_7\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_53_para_11 and node section_53_para_11\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_42_para_19 and node section_42_para_19\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_79_para_9 and node section_79_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_15_para_13 and node section_15_para_13\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_12_para_11 and node section_12_para_11\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_77_para_4 and node section_77_para_4\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_61_para_6 and node section_61_para_6\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_60_para_18 and node section_60_para_18\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_0_para_5 and node section_0_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_89_para_12 and node section_89_para_12\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_21_para_14 and node section_21_para_14\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_24 and node section_90_para_24\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_15_para_5 and node section_15_para_5\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_85_para_15 and node section_85_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_90_para_17 and node section_90_para_17\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_43_para_15 and node section_43_para_15\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_53_para_9 and node section_53_para_9\n",
      "[INFO] Removed edge fused_document_0_2d17bd8a -> section_80_para_4 and node section_80_para_4\n",
      "[INFO] Fusion time: 0.018 seconds\n",
      "[INFO] Total wasted time in calculations: 0.000 seconds\n",
      "context: fused_fused_document_0_2d17bd8a_1_3b175ef1: From section_0: II. Fully Implementing the Judicial Accountability System............... 74 III. Advancing the Reform of Organizational Structure of Courts..... 86 Improving the Judicial Management System and the XI. Advancing the Construction of Intelligent Courts...................... 155\n",
      "----\n",
      "From section_1: the system of rule by law. Comprehensively deepening judicial reform of the judiciary, achieving fruitful results.\n",
      "----\n",
      "From section_5: the judicial system and fully implementing the judicial accountability system marks a new stage of the judicial system reform. Based on the realities of the Comprehensive and Supporting Reform of the Judicial System in the Courts 2019-2023 as an important program for instructing the people’s courts to deepen the comprehensive and supporting reform of the judicial\n",
      "----\n",
      "From section_7: arranging, and coordinating the judicial reform of courts, holding plenary\n",
      "----\n",
      "From section_8: II. Fully Implementing the Judicial Accountability System of the reform of the judicial system that one who tries a case shall have the the judicial accountability system in the people’s courts, establishing a courts nationwide to advance the reform of the judicial accountability further comprehensively implementing the judicial accountability system, of law, to promote full implementation of the judicial accountability\n",
      "----\n",
      "From section_11: of social services, setting out the scope, procedures, and standards for courts court management, logistics support, judicial transparency, informatization,\n",
      "----\n",
      "From section_12: courts with procedural and auxiliary judicial services. Improving the mechanism for regular handling of cases by court/ tribunal presidents. The courts nationwide have implemented the judge April 2017, the Supreme People’s Court issued opinions on implementation\n",
      "----\n",
      "From section_13: supervision and management mechanism to instruct the courts at all levels to improve the new supervision and management system. The courts at all the entire court, all staff, and whole process through informatization. The Improving the chief judge meeting system. Most of the courts at all levels\n",
      "----\n",
      "From section_14: in people’s courts to improve the rules of procedure of professional judge Court has formulated guidelines to strengthen the function of the judicial judicial committees on cases and the grounds therefor shall be made public\n",
      "----\n",
      "From section_15: submitted to the judicial committees in the people’s courts at all levels for all courts in Hainan, since the launch of the reform of judicial committee search report, and the like. The Supreme People’s Court has established the system of guiding cases, and the like. Hainan Higher People’s Court\n",
      "----\n",
      "From section_20: and functional system of courts is an important part and goal of the judicial reform of the people’s courts, and an important support for the courts have actively promoted the reform of organizational system and Setting up Circuit Courts of the Supreme People’s Court. At the end People’s Court, as standing local judicial organs dispatched by the Supreme\n",
      "----\n",
      "From section_21: playing an important role in improving the socialist judicial system with Enhancing the construction of a specialized IP judicial system. In order courts over cases, and providing guidelines on the appointment of IP judges,\n",
      "----\n",
      "From section_22: cases. In addition, the Supreme People’s Court has also promoted the\n",
      "----\n",
      "From section_24: Setting up Internet courts in Hangzhou, Beijing and Guangzhou. actively address the judicial needs in the Internet era and implement the of Internet Courts. Internet Courts have actively promoted the “online the Internet Courts have successfully and efficiently adjudicated a number of\n",
      "----\n",
      "From section_34: people’s courts at all levels,ensuring the whole process of adjudicating reflect modern judicial civilization. On April 13, 2016, the Supreme People’s Court promulgated the newly amended Court Rules of People’s Courts of the\n",
      "----\n",
      "From section_35: in order to maintain court order, strengthen judicial protection of human\n",
      "----\n",
      "From section_39: people’s courts. The people’s courts have been reforming the system of people and make the people have a stronger sense of gain in the judicial\n",
      "----\n",
      "From section_41: the Supreme People’s Court promulgated the guidelines on promoting the\n",
      "----\n",
      "From section_42: resolution. Most courts nationwide have been carrying out reforms into this\n",
      "----\n",
      "From section_43: in modernizing the governance. In June 2016, the Supreme People’s Court Dispute Resolution Mechanisms in People’s Courts, proposing a “three-\n",
      "----\n",
      "From section_47: the allocation of judicial resources, to innovate and improve the working mechanism, and to alleviate the caseloads. The Supreme People’s Court improve judicial efficiency. Most primary courts in Jiangsu have established\n",
      "----\n",
      "From section_48: involving lawsuits. The Supreme People’s Court has been actively with the law. The courts at all levels have been improving the working alleviates people’s burden. The Supreme People’s Court has launched an courts at four levels nationwide, enabling the Supreme People’s Court, local Court has preliminarily established a national platform for courts to\n",
      "----\n",
      "From section_52: actively developed the structure of courts relying mainly on central courts and supplemented by community courts and circuit adjudication venues, and optimized the regional layout of people’s courts and distribution of judicial\n",
      "----\n",
      "From section_53: People’s Congress, the Supreme People’s Court proposed to “basically solve the Supreme People’s Court issued the Roadmap for Basically Solving was proposed, the people’s courts have comprehensively promoted the\n",
      "----\n",
      "From section_59: power within the people’s courts has been advanced actively and steadily. The Supreme People’s Court has promulgated opinions on improving\n",
      "----\n",
      "From section_60: People’s Court has been simultaneously promoting the construction of four Promoting the openness of judicial process. In November 2014, the China information about the judicial process of the courts nationwide, providing\n",
      "----\n",
      "From section_61: process online. In March 2018, the Supreme People’s Court promulgated provisions on the disclosure of judicial process by the people’s courts\n",
      "----\n",
      "From section_66: on judicial cases, striving to become a new platform for case studies. The people’s courts at all levels have been making efforts to improve judicial\n",
      "----\n",
      "From section_77: IX. Improving the System and Mechanism of Judicial Service The people’s courts shoulder an important mission for protecting the people’s courts at all levels have deepened the reform of the judicial system Enabling the mechanism of judicial service and protection for the documents on providing judicial protection for improving the business\n",
      "----\n",
      "From section_79: improving the judicial protection of property rights. By upholding the IP Cases, and proposed to improve the IP judicial system by improving the\n",
      "----\n",
      "From section_80: Supreme People’s Court issued outlines of judicial protection of intellectual Improving the system and mechanism of judicial protection for to provide judicial protection for comprehensively promoting the have strengthened the establishment of specialized judicial organs for courts and 257 primary people’s courts had established specialized judicial\n",
      "----\n",
      "From section_82: X. Improving the Judicial Management System and the Government, the Supreme People’s Court has promoted the reform of judicial management system, adjusted the jurisdiction system, improved\n",
      "----\n",
      "From section_85: over administrative cases, instructing certain higher people’s courts to, to some designated primary or intermediate people’s courts other than the\n",
      "----\n",
      "From section_89: XI. Advancing the Construction of Intelligent Courts Since 2013, the people’s courts have conscientiously implemented the courts. The open, and intelligent online Apps have been comprehensively developed, and the main framework of court informatization version 3.0 has been established, which greatly promotes the modernization of the judicial system and judicial capability. Development Plan on Informatization of People’s Courts 2016-2020, intelligent courts. In accordance with the guidelines of “systematic projects, standards first”, the Supreme People’s Court has improved the system of standards for informatization of the people’s courts, developed and released\n",
      "----\n",
      "From section_90: for People’s courts (2015) and other normative documents to implement code-based management of 3,500 courts nationwide, built a three-level case security system. The courts at all levels have been constantly upgrading and improving the court network systems to support online handling of all recognition in process, and other functions. The Supreme People’s Court Fully promoting electronic litigation. For further development in the the courts at all levels have been vigorously promoting electronic litigation for whole-process online. The Supreme People’s Court has been instructing\n",
      "----\n",
      "From section_91: and promoting the courts nationwide to deploy five online standard modules\n",
      "----\n",
      "From section_92: Strengthening the intelligent assistance in case trial and judicial handling and the intelligent assistance in case trial for judges. Relying on has generated the information about cases files of courts nationwide, which\n",
      "----\n",
      "From section_93: decision making. The Supreme People’s Court has built a big database to collect, manage, and analyze the judicial information from the courts 2016, the courts nationwide fully realized the integration of judicial statistics\n",
      "----\n",
      "From section_94: be finished. In the next step, the people’s courts will, follow the guidance\n",
      "----\n",
      "From section_95: and justice in each judicial case, make the fair, efficient and authoritative law, advance the judicial civilization to a higher level, and strive to make the\n",
      "B\n",
      "Question 1: 66f36490821e116aacb2cc22\n",
      "Predicted: B, Ground Truth: D\n",
      "Correct: ✗\n",
      "\n",
      "=== RÉSULTATS FINAUX ===\n",
      "Total traité: 1\n",
      "Réponses correctes: 0\n",
      "Accuracy: 0.000 (0.0%)\n"
     ]
    }
   ],
   "source": [
    "# Load of LongBench-v2 dataset\n",
    "import pandas as pd\n",
    "import time\n",
    "# Login using e.g. `huggingface-cli login` to access this dataset\n",
    "df = pd.read_json(\"hf://datasets/zai-org/LongBench-v2/data.json\")\n",
    "\n",
    "print(f\"Dataset loaded with {len(df)} samples\")\n",
    "print(f\"Columns: {df.columns.tolist()}\")\n",
    "print(f\"Sample domains: {df['domain'].value_counts().head()}\")\n",
    "\n",
    "# Graph generation from LongBench-v2 dataset\n",
    "\"\"\"\n",
    "graphs, questions, choices, ground_truth_answers = generate_graphs_from_longbench_df(\n",
    "    df, start_index=0, max_items=100  # Limité à 100 pour test, enlever max_items pour tout traiter\n",
    ")\n",
    "\"\"\"\n",
    "\n",
    "graphs, questions, choices, ground_truth_answers = load_longbench_data()\n",
    "\n",
    "\n",
    "# Alternative: LLM use for testing purposes\n",
    "# context, questions, choices, ground_truth_answers = llm_only_longbench_df(\n",
    "#     df, start_index=0, max_items=100\n",
    "# )\n",
    "\n",
    "answers = {}\n",
    "i = 0\n",
    "\n",
    "for qid, G in graphs.items():\n",
    "\n",
    "        if qid != \"66f36490821e116aacb2cc22\":\n",
    "            continue\n",
    "        print(f'qid: {qid}')\n",
    "            \n",
    "        time_start = time.time()\n",
    "\n",
    "        if len(G.nodes) == 0:\n",
    "            raise ValueError(\"Graphe vide\")\n",
    "\n",
    "        embeddings = {n: model.encode(G.nodes[n][\"text\"], normalize_embeddings=True) for n in G.nodes}\n",
    "        embedding_store = EmbeddingStore(vectors=embeddings)\n",
    "        question = questions[qid]\n",
    "        question_choices = choices[qid]\n",
    "\n",
    "        path_with_scores = recursive_traversal_with_score_fusion_fgw_genetic_optimized(\n",
    "            \"document\", question, embedding_store, G, model,\n",
    "            sim_threshold=0.7, fgw_threshold=1.3, alpha=0.8,\n",
    "            structure_distance='similarity_weighted'\n",
    "        )\n",
    "\n",
    "        node_ids = [nid for nid in path_with_scores]\n",
    "        last_step = node_ids[-1]  # TraversalStep object\n",
    "        last_node_id = last_step.node_id\n",
    "\n",
    "        context = last_node_id + \": \" + G.nodes[last_node_id][\"text\"]\n",
    "        print(f\"context: {context}\")\n",
    "        prompt = build_EM_prompt_longbench(question, context, question_choices)\n",
    "        \n",
    "        answer = ask_llm_multiple_choice(prompt, client)\n",
    "        print(answer)\n",
    "\n",
    "\n",
    "        answers[qid] = answer\n",
    "        ground_truth = ground_truth_answers[qid]\n",
    "        \n",
    "        print(f\"Question {i+1}: {qid}\")\n",
    "        print(f\"Predicted: {answer}, Ground Truth: {ground_truth}\")\n",
    "        print(f\"Correct: {'✓' if answer == ground_truth else '✗'}\")\n",
    "        \n",
    "        i += 1\n",
    "\n",
    "        # Save each 10 iterations\n",
    "        if i % 10 == 0:\n",
    "            results = {\n",
    "                \"answers\": answers,\n",
    "                \"ground_truth\": ground_truth_answers,\n",
    "                \"metadata\": {\n",
    "                    \"dataset\": \"LongBench-v2\",\n",
    "                    \"method\": \"graph_fusion_fgw\",\n",
    "                    \"total_processed\": i\n",
    "                }\n",
    "            }\n",
    "            with open(\"/workspace/longbench-data/longbench_results.json\", \"w\") as f:\n",
    "                json.dump(results, f, indent=2)\n",
    "\n",
    "# Final Save\n",
    "results = {\n",
    "    \"answers\": answers,\n",
    "    \"ground_truth\": ground_truth_answers,\n",
    "    \"metadata\": {\n",
    "        \"dataset\": \"LongBench-v2\",\n",
    "        \"method\": \"graph_fusion_fgw\",\n",
    "        \"total_processed\": i\n",
    "    }\n",
    "}\n",
    "\n",
    "# Accuracy\n",
    "correct = sum(1 for qid in answers if answers[qid] == ground_truth_answers[qid])\n",
    "total = len(answers)\n",
    "accuracy = correct / total if total > 0 else 0\n",
    "\n",
    "results[\"metadata\"][\"accuracy\"] = accuracy\n",
    "results[\"metadata\"][\"correct_answers\"] = correct\n",
    "results[\"metadata\"][\"total_answers\"] = total\n",
    "\n",
    "print(f\"\\n=== Final Results ===\")\n",
    "print(f\"Total processed: {total}\")\n",
    "print(f\"Correct answers: {correct}\")\n",
    "print(f\"Accuracy: {accuracy:.3f} ({accuracy*100:.1f}%)\")\n",
    "\n",
    "with open(\"/workspace/longbench-data/longbench_results_final.json\", \"w\") as f:\n",
    "    json.dump(results, f, indent=2)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "341300a8-8606-42c1-93dc-1257c1cedb80",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Dataset loaded with 503 samples\n",
      "Columns: ['_id', 'domain', 'sub_domain', 'difficulty', 'length', 'question', 'choice_A', 'choice_B', 'choice_C', 'choice_D', 'answer', 'context']\n",
      "Sample domains: domain\n",
      "Single-Document QA                     175\n",
      "Multi-Document QA                      125\n",
      "Long In-context Learning                81\n",
      "Code Repository Understanding           50\n",
      "Long-dialogue History Understanding     39\n",
      "Name: count, dtype: int64\n",
      "Chargement des données LongBench-v2...\n",
      "- Chargement des graphes...\n",
      "- Chargement des questions...\n",
      "- Chargement des choix...\n",
      "- Chargement des réponses...\n",
      "✓ Données chargées avec succès!\n",
      "  - 100 graphes\n",
      "  - 100 questions\n",
      "  - 100 ensembles de choix\n",
      "  - 100 réponses\n",
      "qid: 66f36490821e116aacb2cc22\n",
      "🚀 Using device: cuda\n",
      "[INFO] Starting depth 0 with node document\n",
      "[INFO] Relevant children: ['section_89: 0.627', 'section_90: 0.551', 'section_92: 0.527', 'section_15: 0.521', 'section_21: 0.504', 'section_14: 0.495', 'section_20: 0.494', 'section_91: 0.491', 'section_11: 0.489', 'section_13: 0.489', 'section_0: 0.488', 'section_52: 0.487', 'section_1: 0.486', 'section_34: 0.479', 'section_7: 0.478', 'section_41: 0.478', 'section_36: 0.476', 'section_49: 0.474', 'section_79: 0.474', 'section_39: 0.474', 'section_12: 0.468', 'section_60: 0.467', 'section_94: 0.467', 'section_61: 0.467', 'section_43: 0.466', 'section_5: 0.465', 'section_80: 0.464', 'section_51: 0.461', 'section_47: 0.461', 'section_53: 0.461', 'section_66: 0.457', 'section_93: 0.455', 'section_45: 0.454', 'section_35: 0.451', 'section_48: 0.450', 'section_72: 0.450', 'section_59: 0.448', 'section_24: 0.447', 'section_95: 0.445', 'section_82: 0.443', 'section_8: 0.442', 'section_77: 0.442', 'section_22: 0.441', 'section_85: 0.440', 'section_42: 0.440', 'section_3: 0.436', 'section_65: 0.434', 'section_9: 0.432', 'section_27: 0.431', 'section_83: 0.431', 'section_38: 0.430', 'section_69: 0.430', 'section_19: 0.430', 'section_23: 0.430', 'section_28: 0.429', 'section_37: 0.428', 'section_40: 0.428', 'section_86: 0.428', 'section_71: 0.425', 'section_75: 0.422', 'section_17: 0.422', 'section_10: 0.421', 'section_18: 0.420', 'section_78: 0.409', 'section_73: 0.408', 'section_25: 0.408', 'section_68: 0.404', 'section_55: 0.403', 'section_67: 0.396', 'section_58: 0.392', 'section_50: 0.391', 'section_54: 0.387', 'section_87: 0.383', 'section_4: 0.382', 'section_29: 0.382', 'section_57: 0.382', 'section_64: 0.382', 'section_81: 0.381', 'section_44: 0.380', 'section_6: 0.375', 'section_63: 0.373', 'section_70: 0.373', 'section_2: 0.372', 'section_84: 0.370', 'section_46: 0.360', 'section_62: 0.360', 'section_76: 0.344', 'section_26: 0.343', 'section_33: 0.342', 'section_74: 0.341', 'section_16: 0.334', 'section_30: 0.330', 'section_31: 0.330', 'section_56: 0.303', 'section_32: 0.288', 'section_88: 0.269']\n",
      "[INFO] Probability children: ['section_89: 0.627', 'section_90: 0.551', 'section_92: 0.527', 'section_15: 0.521', 'section_21: 0.504', 'section_14: 0.495', 'section_20: 0.494', 'section_91: 0.491', 'section_11: 0.489', 'section_13: 0.489', 'section_0: 0.488', 'section_52: 0.487', 'section_1: 0.486', 'section_34: 0.479', 'section_7: 0.478', 'section_41: 0.478', 'section_36: 0.476', 'section_49: 0.474', 'section_79: 0.474', 'section_39: 0.474', 'section_12: 0.468', 'section_60: 0.467', 'section_94: 0.467', 'section_61: 0.467', 'section_43: 0.466', 'section_5: 0.465', 'section_80: 0.464', 'section_51: 0.461', 'section_47: 0.461', 'section_53: 0.461', 'section_66: 0.457', 'section_93: 0.455', 'section_45: 0.454', 'section_35: 0.451', 'section_48: 0.450', 'section_72: 0.450', 'section_59: 0.448', 'section_24: 0.447', 'section_95: 0.445', 'section_82: 0.443', 'section_8: 0.442', 'section_77: 0.442', 'section_22: 0.441', 'section_85: 0.440', 'section_42: 0.440', 'section_3: 0.436', 'section_65: 0.434', 'section_9: 0.432', 'section_27: 0.431', 'section_83: 0.431', 'section_38: 0.430', 'section_69: 0.430', 'section_19: 0.430', 'section_23: 0.430', 'section_28: 0.429', 'section_37: 0.428', 'section_40: 0.428', 'section_86: 0.428', 'section_71: 0.425', 'section_75: 0.422', 'section_17: 0.422', 'section_10: 0.421', 'section_18: 0.420', 'section_78: 0.409', 'section_73: 0.408', 'section_25: 0.408', 'section_68: 0.404', 'section_55: 0.403', 'section_67: 0.396', 'section_58: 0.392', 'section_50: 0.391', 'section_54: 0.387', 'section_87: 0.383', 'section_4: 0.382', 'section_29: 0.382', 'section_57: 0.382', 'section_64: 0.382', 'section_81: 0.381', 'section_44: 0.380', 'section_6: 0.375', 'section_63: 0.373', 'section_70: 0.373', 'section_2: 0.372', 'section_84: 0.370', 'section_46: 0.360', 'section_62: 0.360', 'section_76: 0.344', 'section_26: 0.343', 'section_33: 0.342', 'section_74: 0.341', 'section_16: 0.334', 'section_30: 0.330', 'section_31: 0.330', 'section_56: 0.303', 'section_32: 0.288', 'section_88: 0.269']\n",
      "[INFO] Preprocessing time: 1.023 seconds\n",
      "[INFO] Time for the fgw computation : 56.6404 seconds\n",
      "[DEBUG] mid=48, fgw_dist=0.0415, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 17.3246 seconds\n",
      "[DEBUG] mid=72, fgw_dist=0.0549, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 25.8835 seconds\n",
      "[DEBUG] mid=84, fgw_dist=0.0609, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 23.9069 seconds\n",
      "[DEBUG] mid=90, fgw_dist=0.0637, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 60.0979 seconds\n",
      "[DEBUG] mid=93, fgw_dist=0.0652, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 40.7508 seconds\n",
      "[DEBUG] mid=95, fgw_dist=0.0663, distance_restante=1.3000\n",
      "[INFO] Time for the fgw computation : 40.8653 seconds\n",
      "[DEBUG] mid=96, fgw_dist=0.0665, distance_restante=1.3000\n",
      "[INFO] FGW distance: 0.0665\n",
      "[INFO] Optimal set containing: ['section_89', 'section_90', 'section_92', 'section_15', 'section_21', 'section_14', 'section_20', 'section_91', 'section_11', 'section_13', 'section_0', 'section_52', 'section_1', 'section_34', 'section_7', 'section_41', 'section_36', 'section_49', 'section_79', 'section_39', 'section_12', 'section_60', 'section_94', 'section_61', 'section_43', 'section_5', 'section_80', 'section_51', 'section_47', 'section_53', 'section_66', 'section_93', 'section_45', 'section_35', 'section_48', 'section_72', 'section_59', 'section_24', 'section_95', 'section_82', 'section_8', 'section_77', 'section_22', 'section_85', 'section_42', 'section_3', 'section_65', 'section_9', 'section_27', 'section_83', 'section_38', 'section_69', 'section_19', 'section_23', 'section_28', 'section_37', 'section_40', 'section_86', 'section_71', 'section_75', 'section_17', 'section_10', 'section_18', 'section_78', 'section_73', 'section_25', 'section_68', 'section_55', 'section_67', 'section_58', 'section_50', 'section_54', 'section_87', 'section_4', 'section_29', 'section_57', 'section_64', 'section_81', 'section_44', 'section_6', 'section_63', 'section_70', 'section_2', 'section_84', 'section_46', 'section_62', 'section_76', 'section_26', 'section_33', 'section_74', 'section_16', 'section_30', 'section_31', 'section_56', 'section_32', 'section_88'] (FGW<=budget)\n",
      "[INFO] Total candidate set: [('section_89', np.float64(0.6267496550617933)), ('section_90', np.float64(0.551067514688607)), ('section_92', np.float64(0.527393473582852)), ('section_15', np.float64(0.5209869966150691)), ('section_21', np.float64(0.5042426662610824)), ('section_14', np.float64(0.49480933828350376)), ('section_20', np.float64(0.49405740183215086)), ('section_91', np.float64(0.49129264438826414)), ('section_11', np.float64(0.4891024195083264)), ('section_13', np.float64(0.48869800519600526)), ('section_0', np.float64(0.48838352858832956)), ('section_52', np.float64(0.4868527457432956)), ('section_1', np.float64(0.48573370594021126)), ('section_34', np.float64(0.4790674052886398)), ('section_7', np.float64(0.47841185917956336)), ('section_41', np.float64(0.4779669180121834)), ('section_36', np.float64(0.4759443023091984)), ('section_49', np.float64(0.4741211078433121)), ('section_79', np.float64(0.4740735385646635)), ('section_39', np.float64(0.4737202507195505)), ('section_12', np.float64(0.46816889186897526)), ('section_60', np.float64(0.4671592963791612)), ('section_94', np.float64(0.4670540108664893)), ('section_61', np.float64(0.46697365925965356)), ('section_43', np.float64(0.4663953429511987)), ('section_5', np.float64(0.4650753013488992)), ('section_80', np.float64(0.46393180862676453)), ('section_51', np.float64(0.461294276758036)), ('section_47', np.float64(0.46079962133828317)), ('section_53', np.float64(0.460748442435175)), ('section_66', np.float64(0.45711004360040286)), ('section_93', np.float64(0.4551322560303373)), ('section_45', np.float64(0.45379907286991705)), ('section_35', np.float64(0.4514573958886736)), ('section_48', np.float64(0.4500677225675518)), ('section_72', np.float64(0.449667513368372)), ('section_59', np.float64(0.448171275412217)), ('section_24', np.float64(0.44684747623397514)), ('section_95', np.float64(0.444823810195241)), ('section_82', np.float64(0.44262329479058166)), ('section_8', np.float64(0.44219053435991706)), ('section_77', np.float64(0.4415713859805333)), ('section_22', np.float64(0.440843443893062)), ('section_85', np.float64(0.4402176617313658)), ('section_42', np.float64(0.4398808569314656)), ('section_3', np.float64(0.4362338881041904)), ('section_65', np.float64(0.4343147445187952)), ('section_9', np.float64(0.4322435857242268)), ('section_27', np.float64(0.4311951118088315)), ('section_83', np.float64(0.4306694686841649)), ('section_38', np.float64(0.4304001046901278)), ('section_69', np.float64(0.4299666544451012)), ('section_19', np.float64(0.4296989947330434)), ('section_23', np.float64(0.4295626890107457)), ('section_28', np.float64(0.42948623638570416)), ('section_37', np.float64(0.4284740976249529)), ('section_40', np.float64(0.4282361412140222)), ('section_86', np.float64(0.42778006999470053)), ('section_71', np.float64(0.425447557070723)), ('section_75', np.float64(0.4217047501968426)), ('section_17', np.float64(0.4216154577964416)), ('section_10', np.float64(0.4212769309231213)), ('section_18', np.float64(0.4198410500787423)), ('section_78', np.float64(0.4087304133952099)), ('section_73', np.float64(0.4084795026666712)), ('section_25', np.float64(0.40791755103929883)), ('section_68', np.float64(0.40407972338683573)), ('section_55', np.float64(0.40294487870415646)), ('section_67', np.float64(0.3963178776263938)), ('section_58', np.float64(0.39239802475605284)), ('section_50', np.float64(0.3906383279724917)), ('section_54', np.float64(0.38718798662841064)), ('section_87', np.float64(0.3827449903645266)), ('section_4', np.float64(0.3823643763929041)), ('section_29', np.float64(0.3822573813493908)), ('section_57', np.float64(0.3819748510222575)), ('section_64', np.float64(0.38191527616382837)), ('section_81', np.float64(0.38059869468714463)), ('section_44', np.float64(0.3803292135623325)), ('section_6', np.float64(0.37463058218745837)), ('section_63', np.float64(0.37305240069294254)), ('section_70', np.float64(0.37294365583551525)), ('section_2', np.float64(0.3721443203073328)), ('section_84', np.float64(0.37035426201645105)), ('section_46', np.float64(0.36040781817088763)), ('section_62', np.float64(0.36012331231417094)), ('section_76', np.float64(0.34387554901993894)), ('section_26', np.float64(0.34285768496870306)), ('section_33', np.float64(0.34176731949734684)), ('section_74', np.float64(0.34094344778368707)), ('section_16', np.float64(0.3341447951203772)), ('section_30', np.float64(0.3304378281434418)), ('section_31', np.float64(0.33008892278755647)), ('section_56', np.float64(0.3029413460738459)), ('section_32', np.float64(0.2882635662918868)), ('section_88', np.float64(0.26862404985070776))]\n",
      "[INFO] Removed edge document -> section_89 and node section_89\n",
      "[INFO] Removed edge document -> section_90 and node section_90\n",
      "[INFO] Removed edge document -> section_92 and node section_92\n",
      "[INFO] Removed edge document -> section_15 and node section_15\n",
      "[INFO] Removed edge document -> section_21 and node section_21\n",
      "[INFO] Removed edge document -> section_14 and node section_14\n",
      "[INFO] Removed edge document -> section_20 and node section_20\n",
      "[INFO] Removed edge document -> section_91 and node section_91\n",
      "[INFO] Removed edge document -> section_11 and node section_11\n",
      "[INFO] Removed edge document -> section_13 and node section_13\n",
      "[INFO] Removed edge document -> section_0 and node section_0\n",
      "[INFO] Removed edge document -> section_52 and node section_52\n",
      "[INFO] Removed edge document -> section_1 and node section_1\n",
      "[INFO] Removed edge document -> section_34 and node section_34\n",
      "[INFO] Removed edge document -> section_7 and node section_7\n",
      "[INFO] Removed edge document -> section_41 and node section_41\n",
      "[INFO] Removed edge document -> section_36 and node section_36\n",
      "[INFO] Removed edge document -> section_49 and node section_49\n",
      "[INFO] Removed edge document -> section_79 and node section_79\n",
      "[INFO] Removed edge document -> section_39 and node section_39\n",
      "[INFO] Removed edge document -> section_12 and node section_12\n",
      "[INFO] Removed edge document -> section_60 and node section_60\n",
      "[INFO] Removed edge document -> section_94 and node section_94\n",
      "[INFO] Removed edge document -> section_61 and node section_61\n",
      "[INFO] Removed edge document -> section_43 and node section_43\n",
      "[INFO] Removed edge document -> section_5 and node section_5\n",
      "[INFO] Removed edge document -> section_80 and node section_80\n",
      "[INFO] Removed edge document -> section_51 and node section_51\n",
      "[INFO] Removed edge document -> section_47 and node section_47\n",
      "[INFO] Removed edge document -> section_53 and node section_53\n",
      "[INFO] Removed edge document -> section_66 and node section_66\n",
      "[INFO] Removed edge document -> section_93 and node section_93\n",
      "[INFO] Removed edge document -> section_45 and node section_45\n",
      "[INFO] Removed edge document -> section_35 and node section_35\n",
      "[INFO] Removed edge document -> section_48 and node section_48\n",
      "[INFO] Removed edge document -> section_72 and node section_72\n",
      "[INFO] Removed edge document -> section_59 and node section_59\n",
      "[INFO] Removed edge document -> section_24 and node section_24\n",
      "[INFO] Removed edge document -> section_95 and node section_95\n",
      "[INFO] Removed edge document -> section_82 and node section_82\n",
      "[INFO] Removed edge document -> section_8 and node section_8\n",
      "[INFO] Removed edge document -> section_77 and node section_77\n",
      "[INFO] Removed edge document -> section_22 and node section_22\n",
      "[INFO] Removed edge document -> section_85 and node section_85\n",
      "[INFO] Removed edge document -> section_42 and node section_42\n",
      "[INFO] Removed edge document -> section_3 and node section_3\n",
      "[INFO] Removed edge document -> section_65 and node section_65\n",
      "[INFO] Removed edge document -> section_9 and node section_9\n",
      "[INFO] Removed edge document -> section_27 and node section_27\n",
      "[INFO] Removed edge document -> section_83 and node section_83\n",
      "[INFO] Removed edge document -> section_38 and node section_38\n",
      "[INFO] Removed edge document -> section_69 and node section_69\n",
      "[INFO] Removed edge document -> section_19 and node section_19\n",
      "[INFO] Removed edge document -> section_23 and node section_23\n",
      "[INFO] Removed edge document -> section_28 and node section_28\n",
      "[INFO] Removed edge document -> section_37 and node section_37\n",
      "[INFO] Removed edge document -> section_40 and node section_40\n",
      "[INFO] Removed edge document -> section_86 and node section_86\n",
      "[INFO] Removed edge document -> section_71 and node section_71\n",
      "[INFO] Removed edge document -> section_75 and node section_75\n",
      "[INFO] Removed edge document -> section_17 and node section_17\n",
      "[INFO] Removed edge document -> section_10 and node section_10\n",
      "[INFO] Removed edge document -> section_18 and node section_18\n",
      "[INFO] Removed edge document -> section_78 and node section_78\n",
      "[INFO] Removed edge document -> section_73 and node section_73\n",
      "[INFO] Removed edge document -> section_25 and node section_25\n",
      "[INFO] Removed edge document -> section_68 and node section_68\n",
      "[INFO] Removed edge document -> section_55 and node section_55\n",
      "[INFO] Removed edge document -> section_67 and node section_67\n",
      "[INFO] Removed edge document -> section_58 and node section_58\n",
      "[INFO] Removed edge document -> section_50 and node section_50\n",
      "[INFO] Removed edge document -> section_54 and node section_54\n",
      "[INFO] Removed edge document -> section_87 and node section_87\n",
      "[INFO] Removed edge document -> section_4 and node section_4\n",
      "[INFO] Removed edge document -> section_29 and node section_29\n",
      "[INFO] Removed edge document -> section_57 and node section_57\n",
      "[INFO] Removed edge document -> section_64 and node section_64\n",
      "[INFO] Removed edge document -> section_81 and node section_81\n",
      "[INFO] Removed edge document -> section_44 and node section_44\n",
      "[INFO] Removed edge document -> section_6 and node section_6\n",
      "[INFO] Removed edge document -> section_63 and node section_63\n",
      "[INFO] Removed edge document -> section_70 and node section_70\n",
      "[INFO] Removed edge document -> section_2 and node section_2\n",
      "[INFO] Removed edge document -> section_84 and node section_84\n",
      "[INFO] Removed edge document -> section_46 and node section_46\n",
      "[INFO] Removed edge document -> section_62 and node section_62\n",
      "[INFO] Removed edge document -> section_76 and node section_76\n",
      "[INFO] Removed edge document -> section_26 and node section_26\n",
      "[INFO] Removed edge document -> section_33 and node section_33\n",
      "[INFO] Removed edge document -> section_74 and node section_74\n",
      "[INFO] Removed edge document -> section_16 and node section_16\n",
      "[INFO] Removed edge document -> section_30 and node section_30\n",
      "[INFO] Removed edge document -> section_31 and node section_31\n",
      "[INFO] Removed edge document -> section_56 and node section_56\n",
      "[INFO] Removed edge document -> section_32 and node section_32\n",
      "[INFO] Removed edge document -> section_88 and node section_88\n",
      "[INFO] Fusion time: 0.119 seconds\n",
      "[INFO] Starting depth 1 with node fused_document_0_04551f57\n",
      "[INFO] Relevant children: ['section_89_para_4: 0.729', 'section_89_para_17: 0.708', 'section_53_para_24: 0.647', 'section_20_para_7: 0.638', 'section_60_para_21: 0.631', 'section_40_para_17: 0.628', 'section_66_para_10: 0.626', 'section_89_para_15: 0.626', 'section_20_para_15: 0.622', 'section_27_para_16: 0.619', 'section_3_para_9: 0.612', 'section_18_para_9: 0.609', 'section_52_para_11: 0.604', 'section_0_para_6: 0.602', 'section_89_para_19: 0.592', 'section_39_para_7: 0.591', 'section_27_para_4: 0.587', 'section_93_para_6: 0.587', 'section_0_para_23: 0.587', 'section_47_para_7: 0.585', 'section_10_para_20: 0.585', 'section_24_para_10: 0.585', 'section_8_para_9: 0.585', 'section_15_para_17: 0.584', 'section_5_para_15: 0.584', 'section_90_para_5: 0.582', 'section_48_para_19: 0.582', 'section_21_para_17: 0.581', 'section_52_para_12: 0.581', 'section_5_para_14: 0.579', 'section_92_para_7: 0.577', 'section_82_para_4: 0.576', 'section_13_para_26: 0.575', 'section_24_para_27: 0.574', 'section_61_para_7: 0.573', 'section_67_para_15: 0.572', 'section_48_para_16: 0.571', 'section_13_para_4: 0.571', 'section_93_para_5: 0.570', 'section_14_para_7: 0.570', 'section_4_para_20: 0.569', 'section_48_para_7: 0.568', 'section_60_para_8: 0.568', 'section_48_para_5: 0.566', 'section_20_para_8: 0.566', 'section_1_para_17: 0.565', 'section_78_para_4: 0.565', 'section_3_para_22: 0.564', 'section_52_para_13: 0.564', 'section_95_para_5: 0.563', 'section_85_para_8: 0.562', 'section_89_para_10: 0.562', 'section_39_para_13: 0.562', 'section_7_para_12: 0.561', 'section_75_para_26: 0.560', 'section_2_para_23: 0.560', 'section_48_para_14: 0.559', 'section_90_para_4: 0.559', 'section_40_para_27: 0.559', 'section_90_para_27: 0.558', 'section_5_para_12: 0.557', 'section_43_para_13: 0.556', 'section_2_para_11: 0.556', 'section_15_para_26: 0.556', 'section_89_para_11: 0.556', 'section_13_para_5: 0.555', 'section_14_para_16: 0.555', 'section_95_para_9: 0.554', 'section_89_para_5: 0.554', 'section_89_para_18: 0.554', 'section_34_para_15: 0.553', 'section_77_para_10: 0.553', 'section_75_para_10: 0.553', 'section_46_para_19: 0.552', 'section_17_para_7: 0.551', 'section_30_para_15: 0.551', 'section_94_para_21: 0.549', 'section_37_para_7: 0.549', 'section_2_para_22: 0.548', 'section_35_para_5: 0.548', 'section_80_para_15: 0.548', 'section_78_para_7: 0.548', 'section_80_para_13: 0.547', 'section_83_para_26: 0.547', 'section_20_para_10: 0.547', 'section_73_para_25: 0.546', 'section_65_para_23: 0.545', 'section_59_para_7: 0.545', 'section_0_para_25: 0.545', 'section_8_para_16: 0.544', 'section_89_para_9: 0.543', 'section_66_para_9: 0.543', 'section_47_para_6: 0.542', 'section_90_para_10: 0.542', 'section_84_para_23: 0.542', 'section_37_para_14: 0.541', 'section_54_para_20: 0.541', 'section_8_para_11: 0.540', 'section_90_para_26: 0.540', 'section_77_para_15: 0.539', 'section_37_para_13: 0.539', 'section_8_para_13: 0.538', 'section_19_para_4: 0.538', 'section_24_para_17: 0.537', 'section_44_para_16: 0.537', 'section_9_para_20: 0.536', 'section_16_para_9: 0.536', 'section_46_para_26: 0.536', 'section_34_para_27: 0.536', 'section_12_para_9: 0.536', 'section_86_para_17: 0.534', 'section_91_para_4: 0.534', 'section_37_para_12: 0.534', 'section_44_para_12: 0.534', 'section_46_para_17: 0.534', 'section_5_para_10: 0.534', 'section_11_para_22: 0.534', 'section_84_para_7: 0.534', 'section_8_para_4: 0.533', 'section_77_para_17: 0.533', 'section_3_para_21: 0.533', 'section_37_para_20: 0.532', 'section_9_para_21: 0.531', 'section_59_para_8: 0.530', 'section_12_para_10: 0.530', 'section_93_para_14: 0.530', 'section_11_para_25: 0.530', 'section_92_para_15: 0.529', 'section_1_para_7: 0.529', 'section_80_para_21: 0.529', 'section_22_para_6: 0.529', 'section_90_para_9: 0.529', 'section_56_para_25: 0.528', 'section_14_para_20: 0.528', 'section_37_para_5: 0.528', 'section_41_para_17: 0.528', 'section_17_para_15: 0.527', 'section_8_para_6: 0.527', 'section_21_para_24: 0.527', 'section_20_para_20: 0.527', 'section_73_para_16: 0.526', 'section_68_para_21: 0.525', 'section_5_para_8: 0.525', 'section_63_para_27: 0.524', 'section_13_para_10: 0.524', 'section_92_para_13: 0.524', 'section_34_para_26: 0.524', 'section_80_para_17: 0.523', 'section_25_para_22: 0.523', 'section_78_para_8: 0.522', 'section_56_para_23: 0.521', 'section_79_para_24: 0.521', 'section_82_para_8: 0.521', 'section_24_para_8: 0.521', 'section_12_para_26: 0.520', 'section_47_para_15: 0.520', 'section_77_para_6: 0.520', 'section_3_para_16: 0.519', 'section_73_para_14: 0.519', 'section_82_para_7: 0.519', 'section_53_para_11: 0.519', 'section_71_para_16: 0.518', 'section_29_para_10: 0.518', 'section_10_para_23: 0.518', 'section_42_para_19: 0.517', 'section_79_para_9: 0.517', 'section_15_para_13: 0.517', 'section_58_para_14: 0.516', 'section_6_para_4: 0.516', 'section_19_para_7: 0.516', 'section_12_para_11: 0.515', 'section_4_para_16: 0.515', 'section_77_para_4: 0.515', 'section_61_para_6: 0.514', 'section_57_para_7: 0.514', 'section_70_para_12: 0.513', 'section_60_para_18: 0.513', 'section_0_para_5: 0.513', 'section_89_para_12: 0.513', 'section_21_para_14: 0.513', 'section_90_para_24: 0.513', 'section_15_para_5: 0.513', 'section_85_para_15: 0.513', 'section_90_para_17: 0.512', 'section_43_para_15: 0.511', 'section_68_para_7: 0.511', 'section_53_para_9: 0.511', 'section_44_para_10: 0.511', 'section_73_para_22: 0.511', 'section_80_para_4: 0.511', 'section_85_para_11: 0.510', 'section_77_para_16: 0.510', 'section_94_para_18: 0.509', 'section_0_para_20: 0.508', 'section_62_para_26: 0.508', 'section_21_para_9: 0.508', 'section_24_para_15: 0.508', 'section_90_para_14: 0.507', 'section_21_para_5: 0.507', 'section_3_para_5: 0.507', 'section_25_para_8: 0.507', 'section_86_para_4: 0.507', 'section_24_para_20: 0.506', 'section_36_para_13: 0.506', 'section_2_para_8: 0.506', 'section_65_para_15: 0.505', 'section_20_para_5: 0.504', 'section_83_para_9: 0.504', 'section_7_para_17: 0.504', 'section_76_para_9: 0.504', 'section_14_para_27: 0.503', 'section_39_para_12: 0.503', 'section_64_para_18: 0.502', 'section_7_para_15: 0.502', 'section_80_para_6: 0.502', 'section_11_para_12: 0.502', 'section_52_para_10: 0.502', 'section_60_para_10: 0.502', 'section_35_para_18: 0.502', 'section_92_para_10: 0.502', 'section_71_para_13: 0.502', 'section_3_para_8: 0.501', 'section_7_para_16: 0.501', 'section_20_para_24: 0.501', 'section_7_para_10: 0.501', 'section_92_para_16: 0.501', 'section_47_para_21: 0.501', 'section_60_para_12: 0.500', 'section_87_para_15: 0.500', 'section_20_para_11: 0.500', 'section_48_para_24: 0.500', 'section_24_para_9: 0.499', 'section_14_para_15: 0.499', 'section_79_para_7: 0.499', 'section_51_para_26: 0.499', 'section_4_para_24: 0.499', 'section_18_para_14: 0.499', 'section_9_para_24: 0.499', 'section_7_para_19: 0.498', 'section_69_para_10: 0.498', 'section_37_para_24: 0.497', 'section_41_para_18: 0.497', 'section_72_para_18: 0.497', 'section_2_para_13: 0.497', 'section_46_para_18: 0.497', 'section_56_para_18: 0.496', 'section_39_para_6: 0.496', 'section_53_para_14: 0.496', 'section_62_para_5: 0.496', 'section_75_para_24: 0.495', 'section_92_para_17: 0.495', 'section_2_para_18: 0.495', 'section_15_para_21: 0.495', 'section_59_para_20: 0.495', 'section_13_para_6: 0.495', 'section_79_para_5: 0.495', 'section_49_para_11: 0.495', 'section_37_para_6: 0.495', 'section_68_para_4: 0.493', 'section_8_para_17: 0.493', 'section_17_para_14: 0.493', 'section_40_para_13: 0.493', 'section_94_para_17: 0.493', 'section_13_para_20: 0.492', 'section_89_para_24: 0.492', 'section_75_para_14: 0.492', 'section_82_para_21: 0.492', 'section_84_para_4: 0.492', 'section_16_para_25: 0.492', 'section_18_para_8: 0.491', 'section_47_para_5: 0.490', 'section_12_para_27: 0.490', 'section_13_para_7: 0.490', 'section_53_para_20: 0.490', 'section_94_para_5: 0.490', 'section_13_para_12: 0.489', 'section_27_para_11: 0.489', 'section_73_para_6: 0.489', 'section_74_para_11: 0.489', 'section_93_para_4: 0.488', 'section_70_para_7: 0.488', 'section_60_para_16: 0.488', 'section_66_para_18: 0.487', 'section_89_para_8: 0.487', 'section_2_para_12: 0.486', 'section_12_para_15: 0.486', 'section_75_para_6: 0.486', 'section_0_para_10: 0.486', 'section_72_para_4: 0.486', 'section_44_para_8: 0.485', 'section_72_para_27: 0.485', 'section_18_para_26: 0.485', 'section_85_para_12: 0.485', 'section_43_para_20: 0.485', 'section_86_para_24: 0.484', 'section_77_para_24: 0.484', 'section_65_para_22: 0.484', 'section_65_para_24: 0.484', 'section_60_para_4: 0.484', 'section_75_para_8: 0.484', 'section_20_para_21: 0.484', 'section_35_para_26: 0.484', 'section_83_para_27: 0.484', 'section_10_para_17: 0.483', 'section_35_para_25: 0.483', 'section_20_para_9: 0.483', 'section_43_para_16: 0.482', 'section_13_para_27: 0.482', 'section_18_para_12: 0.482', 'section_61_para_20: 0.481', 'section_13_para_19: 0.481', 'section_52_para_18: 0.481', 'section_8_para_8: 0.481', 'section_62_para_13: 0.481', 'section_57_para_26: 0.480', 'section_14_para_13: 0.480', 'section_8_para_23: 0.480', 'section_28_para_6: 0.480', 'section_27_para_24: 0.479', 'section_37_para_11: 0.479', 'section_39_para_5: 0.478', 'section_51_para_11: 0.478', 'section_3_para_24: 0.478', 'section_2_para_21: 0.478', 'section_14_para_25: 0.478', 'section_46_para_5: 0.477', 'section_90_para_11: 0.477', 'section_17_para_20: 0.477', 'section_41_para_8: 0.477', 'section_92_para_8: 0.477', 'section_27_para_22: 0.475', 'section_46_para_27: 0.475', 'section_76_para_7: 0.475', 'section_13_para_22: 0.475', 'section_63_para_13: 0.475', 'section_3_para_18: 0.475', 'section_59_para_19: 0.475', 'section_3_para_23: 0.474', 'section_13_para_15: 0.474', 'section_41_para_16: 0.474', 'section_34_para_18: 0.474', 'section_67_para_6: 0.474', 'section_12_para_16: 0.474', 'section_46_para_24: 0.473', 'section_55_para_7: 0.473', 'section_6_para_13: 0.473', 'section_74_para_5: 0.473', 'section_60_para_19: 0.473', 'section_20_para_18: 0.473', 'section_65_para_17: 0.472', 'section_72_para_19: 0.472', 'section_52_para_6: 0.472', 'section_6_para_11: 0.472', 'section_41_para_19: 0.472', 'section_93_para_11: 0.472', 'section_72_para_13: 0.472', 'section_78_para_15: 0.471', 'section_23_para_25: 0.471', 'section_1_para_13: 0.471', 'section_70_para_9: 0.471', 'section_64_para_20: 0.470', 'section_47_para_9: 0.470', 'section_12_para_19: 0.470', 'section_95_para_10: 0.470', 'section_95_para_8: 0.470', 'section_22_para_9: 0.470', 'section_62_para_11: 0.469', 'section_19_para_5: 0.469', 'section_57_para_4: 0.469', 'section_82_para_13: 0.469', 'section_18_para_17: 0.469', 'section_93_para_16: 0.468', 'section_67_para_9: 0.468', 'section_32_para_26: 0.468', 'section_63_para_23: 0.468', 'section_66_para_20: 0.468', 'section_12_para_18: 0.468', 'section_16_para_24: 0.468', 'section_65_para_25: 0.467', 'section_65_para_16: 0.467', 'section_30_para_18: 0.466', 'section_89_para_14: 0.466', 'section_91_para_26: 0.466', 'section_7_para_18: 0.466', 'section_27_para_19: 0.466', 'section_13_para_25: 0.466', 'section_5_para_13: 0.465', 'section_67_para_14: 0.465', 'section_36_para_4: 0.465', 'section_70_para_21: 0.465', 'section_73_para_11: 0.464', 'section_60_para_17: 0.464', 'section_84_para_9: 0.464', 'section_3_para_19: 0.464', 'section_2_para_14: 0.464', 'section_27_para_18: 0.463', 'section_85_para_25: 0.463', 'section_30_para_23: 0.463', 'section_53_para_7: 0.463', 'section_74_para_7: 0.463', 'section_24_para_14: 0.462', 'section_4_para_22: 0.462', 'section_10_para_8: 0.462', 'section_62_para_12: 0.462', 'section_74_para_17: 0.462', 'section_60_para_14: 0.461', 'section_15_para_14: 0.461', 'section_56_para_5: 0.461', 'section_14_para_21: 0.461', 'section_18_para_11: 0.461', 'section_79_para_14: 0.461', 'section_79_para_6: 0.461', 'section_33_para_12: 0.461', 'section_43_para_19: 0.461', 'section_5_para_17: 0.460', 'section_56_para_24: 0.460', 'section_8_para_12: 0.460', 'section_59_para_10: 0.459', 'section_74_para_10: 0.459', 'section_34_para_13: 0.459', 'section_52_para_8: 0.459', 'section_36_para_10: 0.459', 'section_22_para_7: 0.459', 'section_92_para_5: 0.458', 'section_52_para_19: 0.458', 'section_3_para_4: 0.457', 'section_42_para_13: 0.457', 'section_35_para_19: 0.457', 'section_21_para_27: 0.457', 'section_60_para_9: 0.456', 'section_20_para_13: 0.456', 'section_93_para_13: 0.456', 'section_16_para_27: 0.456', 'section_20_para_14: 0.456', 'section_57_para_19: 0.456', 'section_10_para_12: 0.455', 'section_43_para_6: 0.455', 'section_24_para_16: 0.455', 'section_0_para_14: 0.455', 'section_41_para_24: 0.455', 'section_28_para_11: 0.454', 'section_8_para_18: 0.454', 'section_85_para_16: 0.454', 'section_90_para_22: 0.454', 'section_94_para_10: 0.453', 'section_89_para_16: 0.453', 'section_94_para_7: 0.453', 'section_91_para_10: 0.453', 'section_46_para_4: 0.453', 'section_22_para_26: 0.452', 'section_82_para_19: 0.452', 'section_5_para_11: 0.452', 'section_34_para_6: 0.452', 'section_35_para_9: 0.451', 'section_1_para_14: 0.451', 'section_6_para_10: 0.451', 'section_80_para_20: 0.451', 'section_85_para_23: 0.451', 'section_2_para_4: 0.451', 'section_47_para_11: 0.451', 'section_93_para_8: 0.451', 'section_4_para_7: 0.451', 'section_89_para_3: 0.450', 'section_15_para_3: 0.450', 'section_21_para_3: 0.450', 'section_91_para_3: 0.450', 'section_11_para_3: 0.450', 'section_13_para_3: 0.450', 'section_1_para_3: 0.450', 'section_7_para_3: 0.450', 'section_41_para_3: 0.450', 'section_49_para_3: 0.450', 'section_79_para_3: 0.450', 'section_39_para_3: 0.450', 'section_61_para_3: 0.450', 'section_43_para_3: 0.450', 'section_5_para_3: 0.450', 'section_51_para_3: 0.450', 'section_47_para_3: 0.450', 'section_53_para_3: 0.450', 'section_93_para_3: 0.450', 'section_45_para_3: 0.450', 'section_35_para_3: 0.450', 'section_59_para_3: 0.450', 'section_95_para_3: 0.450', 'section_77_para_3: 0.450', 'section_85_para_3: 0.450', 'section_3_para_3: 0.450', 'section_65_para_3: 0.450', 'section_9_para_3: 0.450', 'section_27_para_3: 0.450', 'section_83_para_3: 0.450', 'section_69_para_3: 0.450', 'section_19_para_3: 0.450', 'section_23_para_3: 0.450', 'section_37_para_3: 0.450', 'section_71_para_3: 0.450', 'section_75_para_3: 0.450', 'section_17_para_3: 0.450', 'section_73_para_3: 0.450', 'section_25_para_3: 0.450', 'section_55_para_3: 0.450', 'section_67_para_3: 0.450', 'section_87_para_3: 0.450', 'section_29_para_3: 0.450', 'section_57_para_3: 0.450', 'section_81_para_3: 0.450', 'section_63_para_3: 0.450', 'section_33_para_3: 0.450', 'section_31_para_3: 0.450', 'section_3_para_12: 0.450', 'section_39_para_18: 0.450', 'section_40_para_25: 0.449', 'section_20_para_22: 0.449', 'section_71_para_4: 0.449', 'section_72_para_10: 0.449', 'section_8_para_24: 0.449', 'section_33_para_20: 0.448', 'section_65_para_19: 0.448', 'section_23_para_19: 0.447', 'section_85_para_9: 0.447', 'section_70_para_10: 0.447', 'section_86_para_22: 0.446', 'section_37_para_16: 0.446', 'section_40_para_8: 0.446', 'section_0_para_3: 0.446', 'section_43_para_17: 0.446', 'section_14_para_24: 0.445', 'section_41_para_4: 0.445', 'section_52_para_7: 0.445', 'section_18_para_4: 0.445', 'section_59_para_12: 0.445', 'section_64_para_11: 0.445', 'section_39_para_9: 0.445', 'section_61_para_14: 0.444', 'section_64_para_24: 0.444', 'section_61_para_22: 0.444', 'section_9_para_15: 0.444', 'section_66_para_16: 0.444', 'section_84_para_11: 0.444', 'section_37_para_23: 0.444', 'section_47_para_23: 0.443', 'section_3_para_6: 0.443', 'section_72_para_25: 0.443', 'section_25_para_11: 0.443', 'section_12_para_22: 0.443', 'section_75_para_25: 0.443', 'section_59_para_9: 0.443', 'section_83_para_14: 0.443', 'section_40_para_22: 0.442', 'section_51_para_10: 0.442', 'section_37_para_19: 0.442', 'section_16_para_5: 0.442', 'section_47_para_12: 0.442', 'section_75_para_15: 0.442', 'section_87_para_14: 0.442', 'section_72_para_12: 0.442', 'section_14_para_5: 0.441', 'section_21_para_20: 0.441', 'section_40_para_24: 0.441', 'section_14_para_14: 0.441', 'section_58_para_9: 0.440', 'section_71_para_12: 0.439', 'section_28_para_14: 0.439', 'section_78_para_27: 0.438', 'section_38_para_5: 0.438', 'section_72_para_15: 0.438', 'section_84_para_20: 0.437', 'section_14_para_6: 0.437', 'section_10_para_16: 0.437', 'section_83_para_4: 0.437', 'section_25_para_27: 0.436', 'section_18_para_21: 0.436', 'section_20_para_23: 0.435', 'section_81_para_5: 0.435', 'section_42_para_22: 0.434', 'section_22_para_16: 0.434', 'section_41_para_26: 0.434', 'section_90_para_25: 0.434', 'section_61_para_23: 0.434', 'section_42_para_18: 0.433', 'section_48_para_10: 0.433', 'section_92_para_24: 0.433', 'section_50_para_8: 0.433', 'section_4_para_21: 0.433', 'section_77_para_23: 0.432', 'section_61_para_10: 0.432', 'section_80_para_14: 0.432', 'section_11_para_6: 0.431', 'section_6_para_17: 0.431', 'section_41_para_22: 0.431', 'section_80_para_10: 0.431', 'section_26_para_13: 0.431', 'section_45_para_21: 0.430', 'section_30_para_4: 0.430', 'section_37_para_17: 0.430', 'section_16_para_26: 0.430', 'section_42_para_25: 0.429', 'section_86_para_8: 0.429', 'section_21_para_10: 0.429', 'section_23_para_5: 0.429', 'section_36_para_9: 0.428', 'section_51_para_9: 0.427', 'section_42_para_20: 0.427', 'section_35_para_6: 0.427', 'section_6_para_9: 0.427', 'section_17_para_21: 0.427', 'section_74_para_4: 0.426', 'section_57_para_27: 0.426', 'section_25_para_19: 0.426', 'section_91_para_19: 0.425', 'section_9_para_18: 0.425', 'section_14_para_9: 0.425', 'section_27_para_8: 0.425', 'section_51_para_18: 0.424', 'section_82_para_9: 0.424', 'section_57_para_6: 0.424', 'section_39_para_16: 0.423', 'section_14_para_10: 0.423', 'section_28_para_20: 0.423', 'section_66_para_11: 0.422', 'section_89_para_23: 0.422', 'section_63_para_14: 0.422', 'section_50_para_19: 0.422', 'section_92_para_4: 0.421', 'section_28_para_13: 0.421', 'section_84_para_10: 0.421', 'section_68_para_16: 0.421', 'section_39_para_22: 0.421', 'section_37_para_15: 0.421', 'section_50_para_10: 0.420', 'section_1_para_9: 0.420', 'section_15_para_18: 0.420', 'section_50_para_16: 0.419', 'section_47_para_17: 0.419', 'section_30_para_10: 0.419', 'section_10_para_26: 0.419', 'section_22_para_12: 0.419', 'section_70_para_13: 0.419', 'section_54_para_24: 0.419', 'section_15_para_16: 0.419', 'section_64_para_13: 0.418', 'section_22_para_24: 0.418', 'section_11_para_16: 0.418', 'section_92_para_14: 0.418', 'section_91_para_23: 0.418', 'section_60_para_23: 0.418', 'section_91_para_6: 0.418', 'section_9_para_9: 0.418', 'section_35_para_12: 0.418', 'section_2_para_15: 0.417', 'section_20_para_16: 0.417', 'section_91_para_12: 0.417', 'section_21_para_13: 0.417', 'section_73_para_15: 0.417', 'section_72_para_20: 0.417', 'section_25_para_23: 0.416', 'section_77_para_11: 0.416', 'section_58_para_20: 0.416', 'section_9_para_22: 0.416', 'section_94_para_20: 0.416', 'section_34_para_10: 0.416', 'section_67_para_19: 0.416', 'section_84_para_8: 0.416', 'section_9_para_27: 0.415', 'section_23_para_20: 0.415', 'section_83_para_7: 0.415', 'section_56_para_26: 0.415', 'section_5_para_9: 0.415', 'section_49_para_22: 0.415', 'section_72_para_6: 0.415', 'section_6_para_16: 0.415', 'section_58_para_23: 0.415', 'section_80_para_19: 0.414', 'section_27_para_10: 0.414', 'section_70_para_5: 0.414', 'section_22_para_25: 0.414', 'section_61_para_26: 0.414', 'section_49_para_15: 0.414', 'section_11_para_10: 0.413', 'section_0_para_17: 0.412', 'section_15_para_20: 0.411', 'section_39_para_24: 0.411', 'section_73_para_17: 0.411', 'section_23_para_9: 0.411', 'section_25_para_13: 0.410', 'section_30_para_16: 0.410', 'section_71_para_7: 0.410', 'section_14_para_8: 0.409', 'section_49_para_26: 0.409', 'section_82_para_16: 0.409', 'section_32_para_18: 0.409', 'section_59_para_13: 0.409', 'section_40_para_6: 0.409', 'section_57_para_15: 0.409', 'section_12_para_23: 0.408', 'section_8_para_22: 0.408', 'section_20_para_17: 0.408', 'section_76_para_10: 0.408', 'section_22_para_5: 0.408', 'section_71_para_15: 0.408', 'section_23_para_11: 0.408', 'section_80_para_9: 0.407', 'section_66_para_6: 0.407', 'section_79_para_23: 0.407', 'section_56_para_9: 0.407', 'section_52_para_20: 0.406', 'section_71_para_22: 0.406', 'section_36_para_12: 0.406', 'section_14_para_22: 0.406', 'section_75_para_13: 0.405', 'section_28_para_22: 0.405', 'section_90_para_12: 0.405', 'section_91_para_17: 0.405', 'section_48_para_27: 0.404', 'section_35_para_8: 0.404', 'section_28_para_21: 0.404', 'section_45_para_12: 0.404', 'section_12_para_12: 0.404', 'section_64_para_4: 0.404', 'section_41_para_9: 0.404', 'section_41_para_21: 0.404', 'section_40_para_18: 0.403', 'section_15_para_12: 0.403', 'section_16_para_6: 0.403', 'section_65_para_5: 0.403', 'section_7_para_5: 0.403', 'section_61_para_18: 0.402', 'section_17_para_17: 0.402', 'section_35_para_7: 0.402', 'section_25_para_25: 0.402', 'section_72_para_16: 0.402', 'section_17_para_27: 0.402', 'section_37_para_22: 0.401', 'section_66_para_27: 0.401', 'section_11_para_21: 0.401', 'section_92_para_21: 0.401', 'section_8_para_5: 0.401', 'section_52_para_9: 0.400', 'section_44_para_6: 0.400', 'section_82_para_11: 0.400', 'section_19_para_17: 0.400', 'section_62_para_9: 0.400', 'section_9_para_13: 0.399', 'section_62_para_4: 0.399', 'section_61_para_27: 0.398', 'section_69_para_11: 0.398', 'section_10_para_13: 0.398', 'section_80_para_8: 0.398', 'section_93_para_20: 0.398', 'section_73_para_21: 0.397', 'section_51_para_16: 0.397', 'section_29_para_23: 0.397', 'section_36_para_7: 0.396', 'section_43_para_18: 0.396', 'section_17_para_19: 0.396', 'section_11_para_4: 0.396', 'section_66_para_7: 0.396', 'section_18_para_10: 0.396', 'section_29_para_9: 0.396', 'section_58_para_18: 0.395', 'section_74_para_19: 0.395', 'section_10_para_4: 0.395', 'section_38_para_12: 0.395', 'section_92_para_18: 0.395', 'section_15_para_27: 0.395', 'section_40_para_21: 0.395', 'section_77_para_19: 0.394', 'section_63_para_12: 0.394', 'section_19_para_10: 0.394', 'section_85_para_20: 0.393', 'section_21_para_18: 0.393', 'section_85_para_6: 0.393', 'section_44_para_24: 0.393', 'section_31_para_19: 0.393', 'section_88_para_7: 0.392', 'section_39_para_17: 0.392', 'section_25_para_21: 0.391', 'section_67_para_26: 0.391', 'section_16_para_8: 0.391', 'section_82_para_24: 0.391', 'section_91_para_24: 0.391', 'section_3_para_26: 0.391', 'section_31_para_15: 0.391', 'section_44_para_20: 0.391', 'section_90_para_8: 0.390', 'section_70_para_11: 0.390', 'section_4_para_27: 0.390', 'section_19_para_6: 0.390', 'section_23_para_22: 0.389', 'section_62_para_23: 0.389', 'section_72_para_9: 0.389', 'section_84_para_27: 0.389', 'section_29_para_8: 0.389', 'section_61_para_11: 0.388', 'section_19_para_22: 0.388', 'section_11_para_8: 0.388', 'section_28_para_10: 0.388', 'section_22_para_21: 0.388', 'section_47_para_13: 0.388', 'section_49_para_13: 0.388', 'section_66_para_12: 0.387', 'section_70_para_8: 0.387', 'section_12_para_13: 0.387', 'section_75_para_21: 0.387', 'section_95_para_6: 0.387', 'section_12_para_6: 0.387', 'section_38_para_8: 0.386', 'section_80_para_11: 0.386', 'section_57_para_25: 0.385', 'section_73_para_19: 0.385', 'section_22_para_22: 0.385', 'section_21_para_26: 0.385', 'section_42_para_7: 0.385', 'section_29_para_22: 0.385', 'section_46_para_9: 0.385', 'section_75_para_9: 0.384', 'section_2_para_16: 0.384', 'section_38_para_16: 0.384', 'section_23_para_16: 0.383', 'section_28_para_24: 0.383', 'section_50_para_11: 0.383', 'section_35_para_15: 0.383', 'section_44_para_21: 0.383', 'section_16_para_4: 0.383', 'section_10_para_14: 0.382', 'section_20_para_19: 0.382', 'section_21_para_7: 0.382', 'section_26_para_9: 0.382', 'section_39_para_23: 0.382', 'section_58_para_4: 0.382', 'section_61_para_24: 0.382', 'section_62_para_25: 0.382', 'section_65_para_18: 0.382', 'section_41_para_6: 0.382', 'section_18_para_7: 0.382', 'section_95_para_7: 0.381', 'section_43_para_8: 0.381', 'section_73_para_5: 0.381', 'section_42_para_12: 0.381', 'section_47_para_10: 0.381', 'section_29_para_4: 0.381', 'section_15_para_4: 0.380', 'section_72_para_26: 0.380', 'section_43_para_9: 0.380', 'section_9_para_12: 0.380', 'section_70_para_14: 0.379', 'section_41_para_20: 0.379', 'section_34_para_19: 0.379', 'section_67_para_17: 0.378', 'section_2_para_5: 0.378', 'section_33_para_26: 0.378', 'section_26_para_11: 0.378', 'section_53_para_21: 0.378', 'section_61_para_25: 0.377', 'section_64_para_16: 0.377', 'section_14_para_18: 0.377', 'section_12_para_21: 0.377', 'section_80_para_7: 0.377', 'section_94_para_9: 0.377', 'section_74_para_24: 0.377', 'section_21_para_22: 0.376', 'section_49_para_8: 0.376', 'section_57_para_9: 0.376', 'section_24_para_13: 0.376', 'section_16_para_10: 0.376', 'section_46_para_25: 0.376', 'section_78_para_10: 0.375', 'section_60_para_7: 0.375', 'section_73_para_13: 0.375', 'section_34_para_20: 0.375', 'section_72_para_17: 0.374', 'section_10_para_15: 0.374', 'section_16_para_11: 0.374', 'section_67_para_25: 0.374', 'section_16_para_23: 0.374', 'section_84_para_13: 0.373', 'section_48_para_9: 0.373', 'section_90_para_7: 0.373', 'section_22_para_14: 0.373', 'section_8_para_7: 0.373', 'section_22_para_15: 0.373', 'section_88_para_4: 0.373', 'section_35_para_24: 0.373', 'section_87_para_5: 0.373', 'section_29_para_27: 0.373', 'section_39_para_15: 0.373', 'section_40_para_11: 0.373', 'section_19_para_11: 0.372', 'section_9_para_4: 0.372', 'section_85_para_19: 0.372', 'section_15_para_19: 0.372', 'section_39_para_11: 0.372', 'section_55_para_20: 0.372', 'section_72_para_24: 0.371', 'section_75_para_12: 0.371', 'section_91_para_11: 0.371', 'section_50_para_7: 0.371', 'section_48_para_8: 0.371', 'section_66_para_15: 0.370', 'section_59_para_21: 0.370', 'section_83_para_18: 0.370', 'section_39_para_8: 0.370', 'section_24_para_12: 0.370', 'section_72_para_21: 0.370', 'section_61_para_13: 0.370', 'section_42_para_8: 0.370', 'section_94_para_12: 0.369', 'section_49_para_24: 0.369', 'section_91_para_9: 0.369', 'section_15_para_6: 0.369', 'section_34_para_12: 0.368', 'section_54_para_7: 0.368', 'section_21_para_19: 0.368', 'section_45_para_19: 0.368', 'section_82_para_5: 0.368', 'section_6_para_22: 0.367', 'section_15_para_23: 0.367', 'section_0_para_9: 0.367', 'section_10_para_11: 0.367', 'section_32_para_23: 0.367', 'section_75_para_5: 0.366', 'section_11_para_11: 0.366', 'section_56_para_27: 0.366', 'section_22_para_18: 0.366', 'section_63_para_20: 0.366', 'section_30_para_24: 0.365', 'section_38_para_15: 0.365', 'section_15_para_8: 0.365', 'section_52_para_14: 0.365', 'section_34_para_23: 0.365', 'section_74_para_21: 0.365', 'section_41_para_11: 0.364', 'section_91_para_5: 0.364', 'section_6_para_14: 0.364', 'section_58_para_11: 0.364', 'section_43_para_11: 0.364', 'section_45_para_5: 0.363', 'section_42_para_11: 0.363', 'section_67_para_12: 0.363', 'section_33_para_21: 0.363', 'section_61_para_5: 0.363', 'section_87_para_25: 0.363', 'section_28_para_12: 0.363', 'section_9_para_5: 0.362', 'section_75_para_4: 0.362', 'section_15_para_22: 0.361', 'section_82_para_15: 0.361', 'section_48_para_11: 0.361', 'section_45_para_15: 0.361', 'section_31_para_27: 0.361', 'section_33_para_7: 0.360', 'section_86_para_25: 0.360', 'section_71_para_19: 0.360', 'section_2_para_7: 0.360', 'section_31_para_12: 0.360', 'section_13_para_11: 0.360', 'section_22_para_20: 0.360', 'section_87_para_18: 0.359', 'section_44_para_4: 0.359', 'section_52_para_21: 0.359', 'section_91_para_15: 0.359', 'section_43_para_7: 0.359', 'section_61_para_21: 0.359', 'section_53_para_8: 0.359', 'section_66_para_23: 0.358', 'section_51_para_23: 0.358', 'section_40_para_26: 0.358', 'section_6_para_25: 0.358', 'section_84_para_16: 0.358', 'section_41_para_5: 0.358', 'section_11_para_7: 0.358', 'section_1_para_15: 0.357', 'section_71_para_24: 0.357', 'section_71_para_5: 0.357', 'section_85_para_7: 0.357', 'section_36_para_15: 0.357', 'section_80_para_23: 0.357', 'section_8_para_14: 0.356', 'section_25_para_18: 0.356', 'section_91_para_27: 0.356', 'section_4_para_13: 0.356', 'section_48_para_17: 0.356', 'section_67_para_7: 0.356', 'section_14_para_4: 0.356', 'section_25_para_9: 0.355', 'section_42_para_15: 0.355', 'section_3_para_15: 0.355', 'section_49_para_17: 0.355', 'section_70_para_19: 0.355', 'section_32_para_15: 0.354', 'section_67_para_5: 0.353', 'section_69_para_4: 0.353', 'section_57_para_13: 0.353', 'section_10_para_9: 0.353', 'section_33_para_17: 0.352', 'section_36_para_18: 0.352', 'section_41_para_12: 0.352', 'section_66_para_19: 0.352', 'section_47_para_8: 0.352', 'section_44_para_26: 0.352', 'section_46_para_20: 0.352', 'section_42_para_14: 0.352', 'section_77_para_18: 0.352', 'section_67_para_21: 0.352', 'section_46_para_21: 0.351', 'section_39_para_21: 0.351', 'section_81_para_4: 0.351', 'section_40_para_16: 0.351', 'section_76_para_12: 0.351', 'section_23_para_8: 0.350', 'section_28_para_28: 0.350', 'section_42_para_27: 0.349', 'section_23_para_26: 0.349', 'section_84_para_24: 0.349', 'section_49_para_21: 0.349', 'section_45_para_8: 0.349', 'section_76_para_5: 0.349', 'section_68_para_26: 0.349', 'section_85_para_21: 0.348', 'section_75_para_16: 0.348', 'section_87_para_22: 0.348', 'section_41_para_10: 0.347', 'section_62_para_24: 0.347', 'section_88_para_6: 0.347', 'section_13_para_8: 0.347', 'section_4_para_9: 0.347', 'section_0_para_24: 0.347', 'section_32_para_27: 0.347', 'section_40_para_9: 0.347', 'section_15_para_25: 0.347', 'section_83_para_20: 0.347', 'section_58_para_13: 0.346', 'section_35_para_20: 0.346', 'section_35_para_23: 0.346', 'section_71_para_17: 0.346', 'section_73_para_24: 0.346', 'section_16_para_19: 0.345', 'section_14_para_19: 0.344', 'section_71_para_18: 0.344', 'section_75_para_11: 0.344', 'section_37_para_8: 0.343', 'section_70_para_17: 0.343', 'section_1_para_6: 0.343', 'section_46_para_22: 0.343', 'section_39_para_20: 0.343', 'section_77_para_9: 0.343', 'section_91_para_25: 0.342', 'section_45_para_4: 0.342', 'section_49_para_5: 0.342', 'section_21_para_15: 0.342', 'section_21_para_23: 0.342', 'section_78_para_16: 0.341', 'section_84_para_19: 0.341', 'section_22_para_4: 0.341', 'section_60_para_24: 0.341', 'section_35_para_21: 0.341', 'section_45_para_26: 0.341', 'section_23_para_15: 0.341', 'section_24_para_22: 0.341', 'section_71_para_10: 0.341', 'section_47_para_20: 0.341', 'section_84_para_15: 0.340', 'section_28_para_25: 0.340', 'section_74_para_9: 0.340', 'section_12_para_7: 0.340', 'section_87_para_27: 0.340', 'section_14_para_11: 0.340', 'section_51_para_12: 0.340', 'section_47_para_24: 0.340', 'section_71_para_9: 0.339', 'section_29_para_24: 0.339', 'section_11_para_27: 0.339', 'section_42_para_24: 0.339', 'section_49_para_4: 0.339', 'section_45_para_18: 0.339', 'section_92_para_25: 0.338', 'section_11_para_24: 0.338', 'section_53_para_19: 0.338', 'section_31_para_7: 0.338', 'section_23_para_14: 0.337', 'section_62_para_6: 0.337', 'section_17_para_8: 0.337', 'section_65_para_9: 0.337', 'section_80_para_24: 0.337', 'section_42_para_16: 0.337', 'section_80_para_22: 0.337', 'section_33_para_27: 0.336', 'section_92_para_19: 0.336', 'section_14_para_17: 0.336', 'section_38_para_19: 0.336', 'section_26_para_15: 0.336', 'section_73_para_12: 0.336', 'section_49_para_7: 0.336', 'section_23_para_12: 0.335', 'section_69_para_12: 0.335', 'section_27_para_14: 0.335', 'section_30_para_19: 0.335', 'section_53_para_17: 0.335', 'section_58_para_10: 0.335', 'section_43_para_10: 0.334', 'section_23_para_10: 0.333', 'section_60_para_22: 0.333', 'section_76_para_8: 0.333', 'section_15_para_24: 0.333', 'section_35_para_10: 0.333', 'section_79_para_11: 0.333', 'section_47_para_22: 0.333', 'section_15_para_10: 0.333', 'section_92_para_11: 0.332', 'section_24_para_19: 0.332', 'section_80_para_18: 0.332', 'section_86_para_19: 0.332', 'section_40_para_14: 0.332', 'section_33_para_11: 0.332', 'section_19_para_8: 0.332', 'section_19_para_21: 0.332', 'section_1_para_8: 0.332', 'section_29_para_12: 0.332', 'section_51_para_15: 0.332', 'section_59_para_6: 0.332', 'section_12_para_20: 0.332', 'section_80_para_25: 0.332', 'section_37_para_21: 0.331', 'section_51_para_4: 0.331', 'section_54_para_26: 0.331', 'section_10_para_5: 0.331', 'section_34_para_5: 0.331', 'section_4_para_15: 0.331', 'section_31_para_16: 0.331', 'section_44_para_23: 0.330', 'section_48_para_6: 0.330', 'section_15_para_11: 0.330', 'section_10_para_27: 0.330', 'section_19_para_12: 0.330', 'section_39_para_10: 0.330', 'section_72_para_11: 0.330', 'section_13_para_9: 0.330', 'section_44_para_18: 0.330', 'section_60_para_15: 0.329', 'section_36_para_5: 0.329', 'section_21_para_12: 0.328', 'section_35_para_4: 0.328', 'section_31_para_22: 0.328', 'section_13_para_23: 0.328', 'section_13_para_21: 0.328', 'section_47_para_18: 0.328', 'section_30_para_26: 0.328', 'section_79_para_20: 0.327', 'section_72_para_14: 0.327', 'section_44_para_9: 0.327', 'section_1_para_16: 0.327', 'section_47_para_14: 0.327', 'section_57_para_20: 0.326', 'section_18_para_20: 0.326', 'section_45_para_23: 0.326', 'section_42_para_6: 0.326', 'section_73_para_10: 0.326', 'section_43_para_4: 0.326', 'section_9_para_11: 0.325', 'section_14_para_12: 0.325', 'section_64_para_10: 0.325', 'section_44_para_13: 0.324', 'section_16_para_12: 0.324', 'section_9_para_10: 0.324', 'section_33_para_19: 0.323', 'section_62_para_20: 0.323', 'section_49_para_27: 0.323', 'section_46_para_16: 0.323', 'section_93_para_10: 0.323', 'section_24_para_26: 0.323', 'section_65_para_6: 0.323', 'section_70_para_16: 0.323', 'section_31_para_23: 0.322', 'section_23_para_17: 0.322', 'section_28_para_16: 0.322', 'section_77_para_8: 0.322', 'section_35_para_11: 0.322', 'section_72_para_22: 0.322', 'section_74_para_23: 0.321', 'section_40_para_20: 0.321', 'section_58_para_17: 0.321', 'section_42_para_23: 0.321', 'section_8_para_20: 0.321', 'section_78_para_18: 0.321', 'section_33_para_16: 0.321', 'section_23_para_18: 0.321', 'section_53_para_15: 0.320', 'section_40_para_23: 0.320', 'section_85_para_24: 0.320', 'section_64_para_23: 0.320', 'section_9_para_23: 0.320', 'section_21_para_8: 0.320', 'section_62_para_16: 0.320', 'section_53_para_23: 0.320', 'section_29_para_16: 0.319', 'section_58_para_5: 0.319', 'section_65_para_4: 0.319', 'section_5_para_7: 0.319', 'section_51_para_5: 0.318', 'section_22_para_13: 0.318', 'section_35_para_13: 0.318', 'section_18_para_28: 0.318', 'section_24_para_18: 0.318', 'section_34_para_4: 0.318', 'section_29_para_5: 0.317', 'section_58_para_7: 0.317', 'section_22_para_8: 0.317', 'section_17_para_6: 0.317', 'section_26_para_14: 0.317', 'section_85_para_22: 0.317', 'section_23_para_24: 0.317', 'section_35_para_14: 0.317', 'section_25_para_15: 0.316', 'section_47_para_25: 0.316', 'section_62_para_22: 0.316', 'section_46_para_6: 0.316', 'section_33_para_14: 0.316', 'section_23_para_27: 0.316', 'section_63_para_28: 0.315', 'section_72_para_23: 0.315', 'section_75_para_22: 0.315', 'section_25_para_7: 0.315', 'section_90_para_16: 0.315', 'section_91_para_22: 0.315', 'section_64_para_6: 0.315', 'section_42_para_17: 0.314', 'section_45_para_20: 0.314', 'section_48_para_20: 0.314', 'section_75_para_7: 0.314', 'section_38_para_4: 0.314', 'section_3_para_10: 0.314', 'section_89_para_20: 0.313', 'section_36_para_21: 0.313', 'section_74_para_20: 0.313', 'section_86_para_23: 0.313', 'section_52_para_15: 0.313', 'section_40_para_19: 0.312', 'section_65_para_21: 0.312', 'section_28_para_23: 0.312', 'section_93_para_12: 0.312', 'section_72_para_5: 0.312', 'section_64_para_17: 0.311', 'section_7_para_11: 0.311', 'section_28_para_17: 0.311', 'section_74_para_25: 0.311', 'section_4_para_6: 0.311', 'section_61_para_12: 0.310', 'section_58_para_8: 0.310', 'section_90_para_13: 0.310', 'section_51_para_7: 0.309', 'section_42_para_5: 0.309', 'section_67_para_10: 0.309', 'section_28_para_7: 0.309', 'section_41_para_14: 0.309', 'section_27_para_15: 0.308', 'section_78_para_13: 0.308', 'section_33_para_22: 0.308', 'section_60_para_13: 0.308', 'section_74_para_22: 0.307', 'section_18_para_16: 0.307', 'section_57_para_24: 0.307', 'section_43_para_5: 0.307', 'section_1_para_10: 0.307', 'section_36_para_27: 0.307', 'section_46_para_14: 0.307', 'section_36_para_6: 0.307', 'section_54_para_23: 0.306', 'section_10_para_22: 0.306', 'section_80_para_27: 0.306', 'section_31_para_17: 0.306', 'section_73_para_7: 0.305', 'section_65_para_13: 0.304', 'section_33_para_23: 0.304', 'section_29_para_19: 0.304', 'section_7_para_13: 0.304', 'section_23_para_6: 0.304', 'section_79_para_13: 0.304', 'section_29_para_20: 0.303', 'section_46_para_12: 0.303', 'section_48_para_13: 0.303', 'section_29_para_13: 0.303', 'section_38_para_11: 0.303', 'section_45_para_13: 0.303', 'section_31_para_18: 0.302', 'section_26_para_4: 0.302', 'section_85_para_18: 0.302', 'section_6_para_7: 0.302', 'section_28_para_19: 0.302', 'section_19_para_15: 0.302', 'section_33_para_24: 0.301', 'section_23_para_23: 0.301', 'section_29_para_7: 0.301', 'section_59_para_5: 0.301', 'section_84_para_25: 0.301', 'section_11_para_15: 0.300', 'section_68_para_11: 0.300', 'section_91_para_20: 0.300', 'section_88_para_9: 0.300', 'section_49_para_9: 0.300', 'section_43_para_27: 0.300', 'section_44_para_14: 0.299', 'section_28_para_4: 0.299', 'section_63_para_6: 0.298', 'section_41_para_13: 0.298', 'section_29_para_18: 0.298', 'section_76_para_6: 0.298', 'section_19_para_19: 0.298', 'section_57_para_22: 0.298', 'section_86_para_16: 0.298', 'section_86_para_11: 0.298', 'section_54_para_14: 0.298', 'section_18_para_27: 0.298', 'section_68_para_10: 0.298', 'section_16_para_21: 0.297', 'section_85_para_27: 0.297', 'section_62_para_10: 0.297', 'section_90_para_18: 0.297', 'section_94_para_13: 0.297', 'section_58_para_12: 0.297', 'section_63_para_9: 0.297', 'section_45_para_14: 0.297', 'section_87_para_26: 0.297', 'section_40_para_10: 0.296', 'section_35_para_27: 0.296', 'section_31_para_9: 0.296', 'section_32_para_6: 0.295', 'section_10_para_24: 0.295', 'section_58_para_22: 0.295', 'section_62_para_27: 0.295', 'section_83_para_24: 0.295', 'section_75_para_20: 0.294', 'section_35_para_16: 0.294', 'section_5_para_27: 0.293', 'section_13_para_16: 0.293', 'section_88_para_5: 0.293', 'section_62_para_17: 0.293', 'section_47_para_16: 0.293', 'section_12_para_17: 0.293', 'section_33_para_15: 0.293', 'section_13_para_13: 0.292', 'section_64_para_5: 0.292', 'section_18_para_22: 0.292']\n",
      "[INFO] Probability children: ['section_89_para_4: 0.729', 'section_89_para_17: 0.708', 'section_53_para_24: 0.647', 'section_20_para_7: 0.638', 'section_60_para_21: 0.631', 'section_40_para_17: 0.628', 'section_66_para_10: 0.626', 'section_89_para_15: 0.626', 'section_20_para_15: 0.622', 'section_27_para_16: 0.619', 'section_3_para_9: 0.612', 'section_18_para_9: 0.609', 'section_52_para_11: 0.604', 'section_0_para_6: 0.602', 'section_89_para_19: 0.592', 'section_39_para_7: 0.591', 'section_27_para_4: 0.587', 'section_93_para_6: 0.587', 'section_0_para_23: 0.587', 'section_47_para_7: 0.585', 'section_10_para_20: 0.585', 'section_24_para_10: 0.585', 'section_8_para_9: 0.585', 'section_15_para_17: 0.584', 'section_5_para_15: 0.584', 'section_90_para_5: 0.582', 'section_48_para_19: 0.582', 'section_21_para_17: 0.581', 'section_52_para_12: 0.581', 'section_5_para_14: 0.579', 'section_92_para_7: 0.577', 'section_82_para_4: 0.576', 'section_13_para_26: 0.575', 'section_24_para_27: 0.574', 'section_61_para_7: 0.573', 'section_67_para_15: 0.572', 'section_48_para_16: 0.571', 'section_13_para_4: 0.571', 'section_93_para_5: 0.570', 'section_14_para_7: 0.570', 'section_4_para_20: 0.569', 'section_48_para_7: 0.568', 'section_60_para_8: 0.568', 'section_48_para_5: 0.566', 'section_20_para_8: 0.566', 'section_1_para_17: 0.565', 'section_78_para_4: 0.565', 'section_3_para_22: 0.564', 'section_52_para_13: 0.564', 'section_95_para_5: 0.563', 'section_85_para_8: 0.562', 'section_89_para_10: 0.562', 'section_39_para_13: 0.562', 'section_7_para_12: 0.561', 'section_75_para_26: 0.560', 'section_2_para_23: 0.560', 'section_48_para_14: 0.559', 'section_90_para_4: 0.559', 'section_40_para_27: 0.559', 'section_90_para_27: 0.558', 'section_5_para_12: 0.557', 'section_43_para_13: 0.556', 'section_2_para_11: 0.556', 'section_15_para_26: 0.556', 'section_89_para_11: 0.556', 'section_13_para_5: 0.555', 'section_14_para_16: 0.555', 'section_95_para_9: 0.554', 'section_89_para_5: 0.554', 'section_89_para_18: 0.554', 'section_34_para_15: 0.553', 'section_77_para_10: 0.553', 'section_75_para_10: 0.553', 'section_46_para_19: 0.552', 'section_17_para_7: 0.551', 'section_30_para_15: 0.551', 'section_94_para_21: 0.549', 'section_37_para_7: 0.549', 'section_2_para_22: 0.548', 'section_35_para_5: 0.548', 'section_80_para_15: 0.548', 'section_78_para_7: 0.548', 'section_80_para_13: 0.547', 'section_83_para_26: 0.547', 'section_20_para_10: 0.547', 'section_73_para_25: 0.546', 'section_65_para_23: 0.545', 'section_59_para_7: 0.545', 'section_0_para_25: 0.545', 'section_8_para_16: 0.544', 'section_89_para_9: 0.543', 'section_66_para_9: 0.543', 'section_47_para_6: 0.542', 'section_90_para_10: 0.542', 'section_84_para_23: 0.542', 'section_37_para_14: 0.541', 'section_54_para_20: 0.541', 'section_8_para_11: 0.540', 'section_90_para_26: 0.540', 'section_77_para_15: 0.539', 'section_37_para_13: 0.539', 'section_8_para_13: 0.538', 'section_19_para_4: 0.538', 'section_24_para_17: 0.537', 'section_44_para_16: 0.537', 'section_9_para_20: 0.536', 'section_16_para_9: 0.536', 'section_46_para_26: 0.536', 'section_34_para_27: 0.536', 'section_12_para_9: 0.536', 'section_86_para_17: 0.534', 'section_91_para_4: 0.534', 'section_37_para_12: 0.534', 'section_44_para_12: 0.534', 'section_46_para_17: 0.534', 'section_5_para_10: 0.534', 'section_11_para_22: 0.534', 'section_84_para_7: 0.534', 'section_8_para_4: 0.533', 'section_77_para_17: 0.533', 'section_3_para_21: 0.533', 'section_37_para_20: 0.532', 'section_9_para_21: 0.531', 'section_59_para_8: 0.530', 'section_12_para_10: 0.530', 'section_93_para_14: 0.530', 'section_11_para_25: 0.530', 'section_92_para_15: 0.529', 'section_1_para_7: 0.529', 'section_80_para_21: 0.529', 'section_22_para_6: 0.529', 'section_90_para_9: 0.529', 'section_56_para_25: 0.528', 'section_14_para_20: 0.528', 'section_37_para_5: 0.528', 'section_41_para_17: 0.528', 'section_17_para_15: 0.527', 'section_8_para_6: 0.527', 'section_21_para_24: 0.527', 'section_20_para_20: 0.527', 'section_73_para_16: 0.526', 'section_68_para_21: 0.525', 'section_5_para_8: 0.525', 'section_63_para_27: 0.524', 'section_13_para_10: 0.524', 'section_92_para_13: 0.524', 'section_34_para_26: 0.524', 'section_80_para_17: 0.523', 'section_25_para_22: 0.523', 'section_78_para_8: 0.522', 'section_56_para_23: 0.521', 'section_79_para_24: 0.521', 'section_82_para_8: 0.521', 'section_24_para_8: 0.521', 'section_12_para_26: 0.520', 'section_47_para_15: 0.520', 'section_77_para_6: 0.520', 'section_3_para_16: 0.519', 'section_73_para_14: 0.519', 'section_82_para_7: 0.519', 'section_53_para_11: 0.519', 'section_71_para_16: 0.518', 'section_29_para_10: 0.518', 'section_10_para_23: 0.518', 'section_42_para_19: 0.517', 'section_79_para_9: 0.517', 'section_15_para_13: 0.517', 'section_58_para_14: 0.516', 'section_6_para_4: 0.516', 'section_19_para_7: 0.516', 'section_12_para_11: 0.515', 'section_4_para_16: 0.515', 'section_77_para_4: 0.515', 'section_61_para_6: 0.514', 'section_57_para_7: 0.514', 'section_70_para_12: 0.513', 'section_60_para_18: 0.513', 'section_0_para_5: 0.513', 'section_89_para_12: 0.513', 'section_21_para_14: 0.513', 'section_90_para_24: 0.513', 'section_15_para_5: 0.513', 'section_85_para_15: 0.513', 'section_90_para_17: 0.512', 'section_43_para_15: 0.511', 'section_68_para_7: 0.511', 'section_53_para_9: 0.511', 'section_44_para_10: 0.511', 'section_73_para_22: 0.511', 'section_80_para_4: 0.511', 'section_85_para_11: 0.510', 'section_77_para_16: 0.510', 'section_94_para_18: 0.509', 'section_0_para_20: 0.508', 'section_62_para_26: 0.508', 'section_21_para_9: 0.508', 'section_24_para_15: 0.508', 'section_90_para_14: 0.507', 'section_21_para_5: 0.507', 'section_3_para_5: 0.507', 'section_25_para_8: 0.507', 'section_86_para_4: 0.507', 'section_24_para_20: 0.506', 'section_36_para_13: 0.506', 'section_2_para_8: 0.506', 'section_65_para_15: 0.505', 'section_20_para_5: 0.504', 'section_83_para_9: 0.504', 'section_7_para_17: 0.504', 'section_76_para_9: 0.504', 'section_14_para_27: 0.503', 'section_39_para_12: 0.503', 'section_64_para_18: 0.502', 'section_7_para_15: 0.502', 'section_80_para_6: 0.502', 'section_11_para_12: 0.502', 'section_52_para_10: 0.502', 'section_60_para_10: 0.502', 'section_35_para_18: 0.502', 'section_92_para_10: 0.502', 'section_71_para_13: 0.502', 'section_3_para_8: 0.501', 'section_7_para_16: 0.501', 'section_20_para_24: 0.501', 'section_7_para_10: 0.501', 'section_92_para_16: 0.501', 'section_47_para_21: 0.501', 'section_60_para_12: 0.500', 'section_87_para_15: 0.500', 'section_20_para_11: 0.500', 'section_48_para_24: 0.500', 'section_24_para_9: 0.499', 'section_14_para_15: 0.499', 'section_79_para_7: 0.499', 'section_51_para_26: 0.499', 'section_4_para_24: 0.499', 'section_18_para_14: 0.499', 'section_9_para_24: 0.499', 'section_7_para_19: 0.498', 'section_69_para_10: 0.498', 'section_37_para_24: 0.497', 'section_41_para_18: 0.497', 'section_72_para_18: 0.497', 'section_2_para_13: 0.497', 'section_46_para_18: 0.497', 'section_56_para_18: 0.496', 'section_39_para_6: 0.496', 'section_53_para_14: 0.496', 'section_62_para_5: 0.496', 'section_75_para_24: 0.495', 'section_92_para_17: 0.495', 'section_2_para_18: 0.495', 'section_15_para_21: 0.495', 'section_59_para_20: 0.495', 'section_13_para_6: 0.495', 'section_79_para_5: 0.495', 'section_49_para_11: 0.495', 'section_37_para_6: 0.495', 'section_68_para_4: 0.493', 'section_8_para_17: 0.493', 'section_17_para_14: 0.493', 'section_40_para_13: 0.493', 'section_94_para_17: 0.493', 'section_13_para_20: 0.492', 'section_89_para_24: 0.492', 'section_75_para_14: 0.492', 'section_82_para_21: 0.492', 'section_84_para_4: 0.492', 'section_16_para_25: 0.492', 'section_18_para_8: 0.491', 'section_47_para_5: 0.490', 'section_12_para_27: 0.490', 'section_13_para_7: 0.490', 'section_53_para_20: 0.490', 'section_94_para_5: 0.490', 'section_13_para_12: 0.489', 'section_27_para_11: 0.489', 'section_73_para_6: 0.489', 'section_74_para_11: 0.489', 'section_93_para_4: 0.488', 'section_70_para_7: 0.488', 'section_60_para_16: 0.488', 'section_66_para_18: 0.487', 'section_89_para_8: 0.487', 'section_2_para_12: 0.486', 'section_12_para_15: 0.486', 'section_75_para_6: 0.486', 'section_0_para_10: 0.486', 'section_72_para_4: 0.486', 'section_44_para_8: 0.485', 'section_72_para_27: 0.485', 'section_18_para_26: 0.485', 'section_85_para_12: 0.485', 'section_43_para_20: 0.485', 'section_86_para_24: 0.484', 'section_77_para_24: 0.484', 'section_65_para_22: 0.484', 'section_65_para_24: 0.484', 'section_60_para_4: 0.484', 'section_75_para_8: 0.484', 'section_20_para_21: 0.484', 'section_35_para_26: 0.484', 'section_83_para_27: 0.484', 'section_10_para_17: 0.483', 'section_35_para_25: 0.483', 'section_20_para_9: 0.483', 'section_43_para_16: 0.482', 'section_13_para_27: 0.482', 'section_18_para_12: 0.482', 'section_61_para_20: 0.481', 'section_13_para_19: 0.481', 'section_52_para_18: 0.481', 'section_8_para_8: 0.481', 'section_62_para_13: 0.481', 'section_57_para_26: 0.480', 'section_14_para_13: 0.480', 'section_8_para_23: 0.480', 'section_28_para_6: 0.480', 'section_27_para_24: 0.479', 'section_37_para_11: 0.479', 'section_39_para_5: 0.478', 'section_51_para_11: 0.478', 'section_3_para_24: 0.478', 'section_2_para_21: 0.478', 'section_14_para_25: 0.478', 'section_46_para_5: 0.477', 'section_90_para_11: 0.477', 'section_17_para_20: 0.477', 'section_41_para_8: 0.477', 'section_92_para_8: 0.477', 'section_27_para_22: 0.475', 'section_46_para_27: 0.475', 'section_76_para_7: 0.475', 'section_13_para_22: 0.475', 'section_63_para_13: 0.475', 'section_3_para_18: 0.475', 'section_59_para_19: 0.475', 'section_3_para_23: 0.474', 'section_13_para_15: 0.474', 'section_41_para_16: 0.474', 'section_34_para_18: 0.474', 'section_67_para_6: 0.474', 'section_12_para_16: 0.474', 'section_46_para_24: 0.473', 'section_55_para_7: 0.473', 'section_6_para_13: 0.473', 'section_74_para_5: 0.473', 'section_60_para_19: 0.473', 'section_20_para_18: 0.473', 'section_65_para_17: 0.472', 'section_72_para_19: 0.472', 'section_52_para_6: 0.472', 'section_6_para_11: 0.472', 'section_41_para_19: 0.472', 'section_93_para_11: 0.472', 'section_72_para_13: 0.472', 'section_78_para_15: 0.471', 'section_23_para_25: 0.471', 'section_1_para_13: 0.471', 'section_70_para_9: 0.471', 'section_64_para_20: 0.470', 'section_47_para_9: 0.470', 'section_12_para_19: 0.470', 'section_95_para_10: 0.470', 'section_95_para_8: 0.470', 'section_22_para_9: 0.470', 'section_62_para_11: 0.469', 'section_19_para_5: 0.469', 'section_57_para_4: 0.469', 'section_82_para_13: 0.469', 'section_18_para_17: 0.469', 'section_93_para_16: 0.468', 'section_67_para_9: 0.468', 'section_32_para_26: 0.468', 'section_63_para_23: 0.468', 'section_66_para_20: 0.468', 'section_12_para_18: 0.468', 'section_16_para_24: 0.468', 'section_65_para_25: 0.467', 'section_65_para_16: 0.467', 'section_30_para_18: 0.466', 'section_89_para_14: 0.466', 'section_91_para_26: 0.466', 'section_7_para_18: 0.466', 'section_27_para_19: 0.466', 'section_13_para_25: 0.466', 'section_5_para_13: 0.465', 'section_67_para_14: 0.465', 'section_36_para_4: 0.465', 'section_70_para_21: 0.465', 'section_73_para_11: 0.464', 'section_60_para_17: 0.464', 'section_84_para_9: 0.464', 'section_3_para_19: 0.464', 'section_2_para_14: 0.464', 'section_27_para_18: 0.463', 'section_85_para_25: 0.463', 'section_30_para_23: 0.463', 'section_53_para_7: 0.463', 'section_74_para_7: 0.463', 'section_24_para_14: 0.462', 'section_4_para_22: 0.462', 'section_10_para_8: 0.462', 'section_62_para_12: 0.462', 'section_74_para_17: 0.462', 'section_60_para_14: 0.461', 'section_15_para_14: 0.461', 'section_56_para_5: 0.461', 'section_14_para_21: 0.461', 'section_18_para_11: 0.461', 'section_79_para_14: 0.461', 'section_79_para_6: 0.461', 'section_33_para_12: 0.461', 'section_43_para_19: 0.461', 'section_5_para_17: 0.460', 'section_56_para_24: 0.460', 'section_8_para_12: 0.460', 'section_59_para_10: 0.459', 'section_74_para_10: 0.459', 'section_34_para_13: 0.459', 'section_52_para_8: 0.459', 'section_36_para_10: 0.459', 'section_22_para_7: 0.459', 'section_92_para_5: 0.458', 'section_52_para_19: 0.458', 'section_3_para_4: 0.457', 'section_42_para_13: 0.457', 'section_35_para_19: 0.457', 'section_21_para_27: 0.457', 'section_60_para_9: 0.456', 'section_20_para_13: 0.456', 'section_93_para_13: 0.456', 'section_16_para_27: 0.456', 'section_20_para_14: 0.456', 'section_57_para_19: 0.456', 'section_10_para_12: 0.455', 'section_43_para_6: 0.455', 'section_24_para_16: 0.455', 'section_0_para_14: 0.455', 'section_41_para_24: 0.455', 'section_28_para_11: 0.454', 'section_8_para_18: 0.454', 'section_85_para_16: 0.454', 'section_90_para_22: 0.454', 'section_94_para_10: 0.453', 'section_89_para_16: 0.453', 'section_94_para_7: 0.453', 'section_91_para_10: 0.453', 'section_46_para_4: 0.453', 'section_22_para_26: 0.452', 'section_82_para_19: 0.452', 'section_5_para_11: 0.452', 'section_34_para_6: 0.452', 'section_35_para_9: 0.451', 'section_1_para_14: 0.451', 'section_6_para_10: 0.451', 'section_80_para_20: 0.451', 'section_85_para_23: 0.451', 'section_2_para_4: 0.451', 'section_47_para_11: 0.451', 'section_93_para_8: 0.451', 'section_4_para_7: 0.451', 'section_89_para_3: 0.450', 'section_15_para_3: 0.450', 'section_21_para_3: 0.450', 'section_91_para_3: 0.450', 'section_11_para_3: 0.450', 'section_13_para_3: 0.450', 'section_1_para_3: 0.450', 'section_7_para_3: 0.450', 'section_41_para_3: 0.450', 'section_49_para_3: 0.450', 'section_79_para_3: 0.450', 'section_39_para_3: 0.450', 'section_61_para_3: 0.450', 'section_43_para_3: 0.450', 'section_5_para_3: 0.450', 'section_51_para_3: 0.450', 'section_47_para_3: 0.450', 'section_53_para_3: 0.450', 'section_93_para_3: 0.450', 'section_45_para_3: 0.450', 'section_35_para_3: 0.450', 'section_59_para_3: 0.450', 'section_95_para_3: 0.450', 'section_77_para_3: 0.450', 'section_85_para_3: 0.450', 'section_3_para_3: 0.450', 'section_65_para_3: 0.450', 'section_9_para_3: 0.450', 'section_27_para_3: 0.450', 'section_83_para_3: 0.450', 'section_69_para_3: 0.450', 'section_19_para_3: 0.450', 'section_23_para_3: 0.450', 'section_37_para_3: 0.450', 'section_71_para_3: 0.450', 'section_75_para_3: 0.450', 'section_17_para_3: 0.450', 'section_73_para_3: 0.450', 'section_25_para_3: 0.450', 'section_55_para_3: 0.450', 'section_67_para_3: 0.450', 'section_87_para_3: 0.450', 'section_29_para_3: 0.450', 'section_57_para_3: 0.450', 'section_81_para_3: 0.450', 'section_63_para_3: 0.450', 'section_33_para_3: 0.450', 'section_31_para_3: 0.450', 'section_3_para_12: 0.450', 'section_39_para_18: 0.450', 'section_40_para_25: 0.449', 'section_20_para_22: 0.449', 'section_71_para_4: 0.449', 'section_72_para_10: 0.449', 'section_8_para_24: 0.449', 'section_33_para_20: 0.448', 'section_65_para_19: 0.448', 'section_23_para_19: 0.447', 'section_85_para_9: 0.447', 'section_70_para_10: 0.447', 'section_86_para_22: 0.446', 'section_37_para_16: 0.446', 'section_40_para_8: 0.446', 'section_0_para_3: 0.446', 'section_43_para_17: 0.446', 'section_14_para_24: 0.445', 'section_41_para_4: 0.445', 'section_52_para_7: 0.445', 'section_18_para_4: 0.445', 'section_59_para_12: 0.445', 'section_64_para_11: 0.445', 'section_39_para_9: 0.445', 'section_61_para_14: 0.444', 'section_64_para_24: 0.444', 'section_61_para_22: 0.444', 'section_9_para_15: 0.444', 'section_66_para_16: 0.444', 'section_84_para_11: 0.444', 'section_37_para_23: 0.444', 'section_47_para_23: 0.443', 'section_3_para_6: 0.443', 'section_72_para_25: 0.443', 'section_25_para_11: 0.443', 'section_12_para_22: 0.443', 'section_75_para_25: 0.443', 'section_59_para_9: 0.443', 'section_83_para_14: 0.443', 'section_40_para_22: 0.442', 'section_51_para_10: 0.442', 'section_37_para_19: 0.442', 'section_16_para_5: 0.442', 'section_47_para_12: 0.442', 'section_75_para_15: 0.442', 'section_87_para_14: 0.442', 'section_72_para_12: 0.442', 'section_14_para_5: 0.441', 'section_21_para_20: 0.441', 'section_40_para_24: 0.441', 'section_14_para_14: 0.441', 'section_58_para_9: 0.440', 'section_71_para_12: 0.439', 'section_28_para_14: 0.439', 'section_78_para_27: 0.438', 'section_38_para_5: 0.438', 'section_72_para_15: 0.438', 'section_84_para_20: 0.437', 'section_14_para_6: 0.437', 'section_10_para_16: 0.437', 'section_83_para_4: 0.437', 'section_25_para_27: 0.436', 'section_18_para_21: 0.436', 'section_20_para_23: 0.435', 'section_81_para_5: 0.435', 'section_42_para_22: 0.434', 'section_22_para_16: 0.434', 'section_41_para_26: 0.434', 'section_90_para_25: 0.434', 'section_61_para_23: 0.434', 'section_42_para_18: 0.433', 'section_48_para_10: 0.433', 'section_92_para_24: 0.433', 'section_50_para_8: 0.433', 'section_4_para_21: 0.433', 'section_77_para_23: 0.432', 'section_61_para_10: 0.432', 'section_80_para_14: 0.432', 'section_11_para_6: 0.431', 'section_6_para_17: 0.431', 'section_41_para_22: 0.431', 'section_80_para_10: 0.431', 'section_26_para_13: 0.431', 'section_45_para_21: 0.430', 'section_30_para_4: 0.430', 'section_37_para_17: 0.430', 'section_16_para_26: 0.430', 'section_42_para_25: 0.429', 'section_86_para_8: 0.429', 'section_21_para_10: 0.429', 'section_23_para_5: 0.429', 'section_36_para_9: 0.428', 'section_51_para_9: 0.427', 'section_42_para_20: 0.427', 'section_35_para_6: 0.427', 'section_6_para_9: 0.427', 'section_17_para_21: 0.427', 'section_74_para_4: 0.426', 'section_57_para_27: 0.426', 'section_25_para_19: 0.426', 'section_91_para_19: 0.425', 'section_9_para_18: 0.425', 'section_14_para_9: 0.425', 'section_27_para_8: 0.425', 'section_51_para_18: 0.424', 'section_82_para_9: 0.424', 'section_57_para_6: 0.424', 'section_39_para_16: 0.423', 'section_14_para_10: 0.423', 'section_28_para_20: 0.423', 'section_66_para_11: 0.422', 'section_89_para_23: 0.422', 'section_63_para_14: 0.422', 'section_50_para_19: 0.422', 'section_92_para_4: 0.421', 'section_28_para_13: 0.421', 'section_84_para_10: 0.421', 'section_68_para_16: 0.421', 'section_39_para_22: 0.421', 'section_37_para_15: 0.421', 'section_50_para_10: 0.420', 'section_1_para_9: 0.420', 'section_15_para_18: 0.420', 'section_50_para_16: 0.419', 'section_47_para_17: 0.419', 'section_30_para_10: 0.419', 'section_10_para_26: 0.419', 'section_22_para_12: 0.419', 'section_70_para_13: 0.419', 'section_54_para_24: 0.419', 'section_15_para_16: 0.419', 'section_64_para_13: 0.418', 'section_22_para_24: 0.418', 'section_11_para_16: 0.418', 'section_92_para_14: 0.418', 'section_91_para_23: 0.418', 'section_60_para_23: 0.418', 'section_91_para_6: 0.418', 'section_9_para_9: 0.418', 'section_35_para_12: 0.418', 'section_2_para_15: 0.417', 'section_20_para_16: 0.417', 'section_91_para_12: 0.417', 'section_21_para_13: 0.417', 'section_73_para_15: 0.417', 'section_72_para_20: 0.417', 'section_25_para_23: 0.416', 'section_77_para_11: 0.416', 'section_58_para_20: 0.416', 'section_9_para_22: 0.416', 'section_94_para_20: 0.416', 'section_34_para_10: 0.416', 'section_67_para_19: 0.416', 'section_84_para_8: 0.416', 'section_9_para_27: 0.415', 'section_23_para_20: 0.415', 'section_83_para_7: 0.415', 'section_56_para_26: 0.415', 'section_5_para_9: 0.415', 'section_49_para_22: 0.415', 'section_72_para_6: 0.415', 'section_6_para_16: 0.415', 'section_58_para_23: 0.415', 'section_80_para_19: 0.414', 'section_27_para_10: 0.414', 'section_70_para_5: 0.414', 'section_22_para_25: 0.414', 'section_61_para_26: 0.414', 'section_49_para_15: 0.414', 'section_11_para_10: 0.413', 'section_0_para_17: 0.412', 'section_15_para_20: 0.411', 'section_39_para_24: 0.411', 'section_73_para_17: 0.411', 'section_23_para_9: 0.411', 'section_25_para_13: 0.410', 'section_30_para_16: 0.410', 'section_71_para_7: 0.410', 'section_14_para_8: 0.409', 'section_49_para_26: 0.409', 'section_82_para_16: 0.409', 'section_32_para_18: 0.409', 'section_59_para_13: 0.409', 'section_40_para_6: 0.409', 'section_57_para_15: 0.409', 'section_12_para_23: 0.408', 'section_8_para_22: 0.408', 'section_20_para_17: 0.408', 'section_76_para_10: 0.408', 'section_22_para_5: 0.408', 'section_71_para_15: 0.408', 'section_23_para_11: 0.408', 'section_80_para_9: 0.407', 'section_66_para_6: 0.407', 'section_79_para_23: 0.407', 'section_56_para_9: 0.407', 'section_52_para_20: 0.406', 'section_71_para_22: 0.406', 'section_36_para_12: 0.406', 'section_14_para_22: 0.406', 'section_75_para_13: 0.405', 'section_28_para_22: 0.405', 'section_90_para_12: 0.405', 'section_91_para_17: 0.405', 'section_48_para_27: 0.404', 'section_35_para_8: 0.404', 'section_28_para_21: 0.404', 'section_45_para_12: 0.404', 'section_12_para_12: 0.404', 'section_64_para_4: 0.404', 'section_41_para_9: 0.404', 'section_41_para_21: 0.404', 'section_40_para_18: 0.403', 'section_15_para_12: 0.403', 'section_16_para_6: 0.403', 'section_65_para_5: 0.403', 'section_7_para_5: 0.403', 'section_61_para_18: 0.402', 'section_17_para_17: 0.402', 'section_35_para_7: 0.402', 'section_25_para_25: 0.402', 'section_72_para_16: 0.402', 'section_17_para_27: 0.402', 'section_37_para_22: 0.401', 'section_66_para_27: 0.401', 'section_11_para_21: 0.401', 'section_92_para_21: 0.401', 'section_8_para_5: 0.401', 'section_52_para_9: 0.400', 'section_44_para_6: 0.400', 'section_82_para_11: 0.400', 'section_19_para_17: 0.400', 'section_62_para_9: 0.400', 'section_9_para_13: 0.399', 'section_62_para_4: 0.399', 'section_61_para_27: 0.398', 'section_69_para_11: 0.398', 'section_10_para_13: 0.398', 'section_80_para_8: 0.398', 'section_93_para_20: 0.398', 'section_73_para_21: 0.397', 'section_51_para_16: 0.397', 'section_29_para_23: 0.397', 'section_36_para_7: 0.396', 'section_43_para_18: 0.396', 'section_17_para_19: 0.396', 'section_11_para_4: 0.396', 'section_66_para_7: 0.396', 'section_18_para_10: 0.396', 'section_29_para_9: 0.396', 'section_58_para_18: 0.395', 'section_74_para_19: 0.395', 'section_10_para_4: 0.395', 'section_38_para_12: 0.395', 'section_92_para_18: 0.395', 'section_15_para_27: 0.395', 'section_40_para_21: 0.395', 'section_77_para_19: 0.394', 'section_63_para_12: 0.394', 'section_19_para_10: 0.394', 'section_85_para_20: 0.393', 'section_21_para_18: 0.393', 'section_85_para_6: 0.393', 'section_44_para_24: 0.393', 'section_31_para_19: 0.393', 'section_88_para_7: 0.392', 'section_39_para_17: 0.392', 'section_25_para_21: 0.391', 'section_67_para_26: 0.391', 'section_16_para_8: 0.391', 'section_82_para_24: 0.391', 'section_91_para_24: 0.391', 'section_3_para_26: 0.391', 'section_31_para_15: 0.391', 'section_44_para_20: 0.391', 'section_90_para_8: 0.390', 'section_70_para_11: 0.390', 'section_4_para_27: 0.390', 'section_19_para_6: 0.390', 'section_23_para_22: 0.389', 'section_62_para_23: 0.389', 'section_72_para_9: 0.389', 'section_84_para_27: 0.389', 'section_29_para_8: 0.389', 'section_61_para_11: 0.388', 'section_19_para_22: 0.388', 'section_11_para_8: 0.388', 'section_28_para_10: 0.388', 'section_22_para_21: 0.388', 'section_47_para_13: 0.388', 'section_49_para_13: 0.388', 'section_66_para_12: 0.387', 'section_70_para_8: 0.387', 'section_12_para_13: 0.387', 'section_75_para_21: 0.387', 'section_95_para_6: 0.387', 'section_12_para_6: 0.387', 'section_38_para_8: 0.386', 'section_80_para_11: 0.386', 'section_57_para_25: 0.385', 'section_73_para_19: 0.385', 'section_22_para_22: 0.385', 'section_21_para_26: 0.385', 'section_42_para_7: 0.385', 'section_29_para_22: 0.385', 'section_46_para_9: 0.385', 'section_75_para_9: 0.384', 'section_2_para_16: 0.384', 'section_38_para_16: 0.384', 'section_23_para_16: 0.383', 'section_28_para_24: 0.383', 'section_50_para_11: 0.383', 'section_35_para_15: 0.383', 'section_44_para_21: 0.383', 'section_16_para_4: 0.383', 'section_10_para_14: 0.382', 'section_20_para_19: 0.382', 'section_21_para_7: 0.382', 'section_26_para_9: 0.382', 'section_39_para_23: 0.382', 'section_58_para_4: 0.382', 'section_61_para_24: 0.382', 'section_62_para_25: 0.382', 'section_65_para_18: 0.382', 'section_41_para_6: 0.382', 'section_18_para_7: 0.382', 'section_95_para_7: 0.381', 'section_43_para_8: 0.381', 'section_73_para_5: 0.381', 'section_42_para_12: 0.381', 'section_47_para_10: 0.381', 'section_29_para_4: 0.381', 'section_15_para_4: 0.380', 'section_72_para_26: 0.380', 'section_43_para_9: 0.380', 'section_9_para_12: 0.380', 'section_70_para_14: 0.379', 'section_41_para_20: 0.379', 'section_34_para_19: 0.379', 'section_67_para_17: 0.378', 'section_2_para_5: 0.378', 'section_33_para_26: 0.378', 'section_26_para_11: 0.378', 'section_53_para_21: 0.378', 'section_61_para_25: 0.377', 'section_64_para_16: 0.377', 'section_14_para_18: 0.377', 'section_12_para_21: 0.377', 'section_80_para_7: 0.377', 'section_94_para_9: 0.377', 'section_74_para_24: 0.377', 'section_21_para_22: 0.376', 'section_49_para_8: 0.376', 'section_57_para_9: 0.376', 'section_24_para_13: 0.376', 'section_16_para_10: 0.376', 'section_46_para_25: 0.376', 'section_78_para_10: 0.375', 'section_60_para_7: 0.375', 'section_73_para_13: 0.375', 'section_34_para_20: 0.375', 'section_72_para_17: 0.374', 'section_10_para_15: 0.374', 'section_16_para_11: 0.374', 'section_67_para_25: 0.374', 'section_16_para_23: 0.374', 'section_84_para_13: 0.373', 'section_48_para_9: 0.373', 'section_90_para_7: 0.373', 'section_22_para_14: 0.373', 'section_8_para_7: 0.373', 'section_22_para_15: 0.373', 'section_88_para_4: 0.373', 'section_35_para_24: 0.373', 'section_87_para_5: 0.373', 'section_29_para_27: 0.373', 'section_39_para_15: 0.373', 'section_40_para_11: 0.373', 'section_19_para_11: 0.372', 'section_9_para_4: 0.372', 'section_85_para_19: 0.372', 'section_15_para_19: 0.372', 'section_39_para_11: 0.372', 'section_55_para_20: 0.372', 'section_72_para_24: 0.371', 'section_75_para_12: 0.371', 'section_91_para_11: 0.371', 'section_50_para_7: 0.371', 'section_48_para_8: 0.371', 'section_66_para_15: 0.370', 'section_59_para_21: 0.370', 'section_83_para_18: 0.370', 'section_39_para_8: 0.370', 'section_24_para_12: 0.370', 'section_72_para_21: 0.370', 'section_61_para_13: 0.370', 'section_42_para_8: 0.370', 'section_94_para_12: 0.369', 'section_49_para_24: 0.369', 'section_91_para_9: 0.369', 'section_15_para_6: 0.369', 'section_34_para_12: 0.368', 'section_54_para_7: 0.368', 'section_21_para_19: 0.368', 'section_45_para_19: 0.368', 'section_82_para_5: 0.368', 'section_6_para_22: 0.367', 'section_15_para_23: 0.367', 'section_0_para_9: 0.367', 'section_10_para_11: 0.367', 'section_32_para_23: 0.367', 'section_75_para_5: 0.366', 'section_11_para_11: 0.366', 'section_56_para_27: 0.366', 'section_22_para_18: 0.366', 'section_63_para_20: 0.366', 'section_30_para_24: 0.365', 'section_38_para_15: 0.365', 'section_15_para_8: 0.365', 'section_52_para_14: 0.365', 'section_34_para_23: 0.365', 'section_74_para_21: 0.365']\n",
      "[INFO] Preprocessing time: 268.808 seconds\n",
      "[INFO] Time for the fgw computation : 179.5402 seconds\n",
      "[DEBUG] mid=466, fgw_dist=0.0663, distance_restante=1.3000\n"
     ]
    }
   ],
   "source": [
    "# Load LongBench-v2 dataset\n",
    "import pandas as pd\n",
    "import time\n",
    "# Login using e.g. `huggingface-cli login` to access this dataset\n",
    "df = pd.read_json(\"hf://datasets/zai-org/LongBench-v2/data.json\")\n",
    "\n",
    "print(f\"Dataset loaded with {len(df)} samples\")\n",
    "print(f\"Columns: {df.columns.tolist()}\")\n",
    "print(f\"Sample domains: {df['domain'].value_counts().head()}\")\n",
    "\n",
    "# Graph generation from LongBench-v2 dataset\n",
    "\"\"\"\n",
    "graphs, questions, choices, ground_truth_answers = generate_graphs_from_longbench_df(\n",
    "    df, start_index=0, max_items=100  # Limited to 100 for testing, remove max_items to process all\n",
    ")\n",
    "\"\"\"\n",
    "\n",
    "graphs, questions, choices, ground_truth_answers = load_longbench_data()\n",
    "\n",
    "\n",
    "# Alternative: LLM use for testing purposes\n",
    "# context, questions, choices, ground_truth_answers = llm_only_longbench_df(\n",
    "#     df, start_index=0, max_items=100\n",
    "# )\n",
    "\n",
    "answers = {}\n",
    "i = 0\n",
    "\n",
    "for qid, G in graphs.items():\n",
    "    try:\n",
    "        if qid != \"66f36490821e116aacb2cc22\":\n",
    "            continue\n",
    "        print(f'qid: {qid}')\n",
    "            \n",
    "        time_start = time.time()\n",
    "\n",
    "        if len(G.nodes) == 0:\n",
    "            raise ValueError(\"Empty graph\")\n",
    "\n",
    "        embeddings = {n: model.encode(G.nodes[n][\"text\"], normalize_embeddings=True) for n in G.nodes}\n",
    "        embedding_store = EmbeddingStore(vectors=embeddings)\n",
    "        question = questions[qid]\n",
    "        question_choices = choices[qid]\n",
    "\n",
    "        path_with_scores = recursive_traversal_with_score_fusion_fgw_genetic_optimized(\n",
    "            \"document\", question, embedding_store, G, model,\n",
    "            sim_threshold=0.4, fgw_threshold=1.3, alpha=0.8,\n",
    "            structure_distance='similarity_weighted'\n",
    "        )\n",
    "\n",
    "        node_ids = [nid for nid in path_with_scores]\n",
    "        last_step = node_ids[-1]  # TraversalStep object\n",
    "        last_node_id = last_step.node_id\n",
    "\n",
    "        context = last_node_id + \": \" + G.nodes[last_node_id][\"text\"]\n",
    "        print(f\"context: {context}\")\n",
    "        prompt = build_EM_prompt_longbench(question, context, question_choices)\n",
    "        \n",
    "        answer = ask_llm_multiple_choice(prompt, client)\n",
    "\n",
    "    except Exception as e:\n",
    "        print(f\"[Error] for qid {qid} : {e}\")\n",
    "        answer = \"A\"  # Default answer in case of error\n",
    "\n",
    "    answers[qid] = answer\n",
    "    ground_truth = ground_truth_answers[qid]\n",
    "    \n",
    "    print(f\"Question {i+1}: {qid}\")\n",
    "    print(f\"Predicted: {answer}, Ground Truth: {ground_truth}\")\n",
    "    print(f\"Correct: {'✓' if answer == ground_truth else '✗'}\")\n",
    "    \n",
    "    i += 1\n",
    "\n",
    "    # Save each 10 iterations\n",
    "    if i % 10 == 0:\n",
    "        results = {\n",
    "            \"answers\": answers,\n",
    "            \"ground_truth\": ground_truth_answers,\n",
    "            \"metadata\": {\n",
    "                \"dataset\": \"LongBench-v2\",\n",
    "                \"method\": \"graph_fusion_fgw\",\n",
    "                \"total_processed\": i\n",
    "            }\n",
    "        }\n",
    "        with open(\"/workspace/longbench-data/longbench_results.json\", \"w\") as f:\n",
    "            json.dump(results, f, indent=2)\n",
    "\n",
    "# Final Save\n",
    "results = {\n",
    "    \"answers\": answers,\n",
    "    \"ground_truth\": ground_truth_answers,\n",
    "    \"metadata\": {\n",
    "        \"dataset\": \"LongBench-v2\",\n",
    "        \"method\": \"graph_fusion_fgw\",\n",
    "        \"total_processed\": i\n",
    "    }\n",
    "}\n",
    "\n",
    "# Accuracy\n",
    "correct = sum(1 for qid in answers if answers[qid] == ground_truth_answers[qid])\n",
    "total = len(answers)\n",
    "accuracy = correct / total if total > 0 else 0\n",
    "\n",
    "results[\"metadata\"][\"accuracy\"] = accuracy\n",
    "results[\"metadata\"][\"correct_answers\"] = correct\n",
    "results[\"metadata\"][\"total_answers\"] = total\n",
    "\n",
    "print(f\"\\n=== FINAL RESULTS ===\")\n",
    "print(f\"Total processed: {total}\")\n",
    "print(f\"Correct answers: {correct}\")\n",
    "print(f\"Accuracy: {accuracy:.3f} ({accuracy*100:.1f}%)\")\n",
    "\n",
    "with open(\"/workspace/longbench-data/longbench_results_final.json\", \"w\") as f:\n",
    "    json.dump(results, f, indent=2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "548c0dd0-a288-453f-acf1-977766bcf045",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python3 (System)",
   "language": "python",
   "name": "system-python"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
