{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "from GPT import GPT\n",
    "import json\n",
    "import re\n",
    "\n",
    "def query_gpt4(d, start, end):\n",
    "    field_texts = json.load(open(f\"prompt/domain.json\"))[d]\n",
    "    variable_texts = json.load(open(f\"prompt/description/{d}.json\"))\n",
    "    input = f'''You are an expert on the {field_texts}\n",
    "    There are two factors:\n",
    "    {start}: {variable_texts[start]}\n",
    "    {end}: {variable_texts[end]}\n",
    "    Which cause-and-effect relationship is more likely for following causal statements V1 V2?\n",
    "    A. changing V1 causes a change in V2.\n",
    "    B. changing V2 causes a change in V1.\n",
    "    C. changes in V1 and in V2 are not correlated.\n",
    "    D. uncertain.\n",
    "    Provide your final answer within the tags <Answer>A/B/C/D</Answer>.\n",
    "    Analyze the statement: {start} {end}'''\n",
    "    prompts = [input]\n",
    "    chatgpt = GPT(\"gpt-4\", 0.7)\n",
    "    outputs = chatgpt.chatgpt_QA_multi(prompts)\n",
    "    output = outputs[0][\"output\"]\n",
    "    answer = re.findall(r\"<Answer>(.*?)</Answer>\",output)[0]\n",
    "    return input, output, answer"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LVEDVOLUME -> CVP\n",
      "LVEDVOLUME -> PCWP\n",
      "LVFAILURE -> HISTORY\n",
      "STROKEVOLUME -> CO\n",
      "ERRCAUTER -> HREKG\n",
      "ERRCAUTER -> HRSAT\n",
      "TPR -> BP\n",
      "KINKEDTUBE -> PRESS\n",
      "KINKEDTUBE -> VENTLUNG\n",
      "PVSAT -> SAO2\n",
      "SAO2 -> CATECHOL\n",
      "SHUNT -> SAO2\n",
      "INTUBATION -> MINVOL\n",
      "INTUBATION -> PRESS\n",
      "INTUBATION -> VENTLUNG\n",
      "DISCONNECT -> VENTTUBE\n",
      "MINVOLSET -> VENTMACH\n",
      "VENTTUBE -> PRESS\n",
      "VENTALV -> PVSAT\n",
      "HR -> HREKG\n",
      "HYPOVOLEMIA => PCWP\n",
      "LVFAILURE => CVP\n",
      "ANAPHYLAXIS => CATECHOL\n",
      "ANAPHYLAXIS => BP\n",
      "TPR => CO\n",
      "PVSAT => CATECHOL\n",
      "PULMEMBOLUS => SAO2\n",
      "PULMEMBOLUS => CO\n",
      "SHUNT => HREKG\n",
      "INTUBATION => HREKG\n",
      "INTUBATION => PVSAT\n",
      "DISCONNECT => HRBP\n",
      "DISCONNECT => HR\n",
      "MINVOLSET => PVSAT\n",
      "MINVOLSET => BP\n",
      "VENTMACH => HRBP\n",
      "VENTTUBE => CO\n",
      "VENTLUNG => CATECHOL\n",
      "VENTALV => CATECHOL\n",
      "ARTCO2 => HR\n",
      "HISTORY <> MINVOLSET\n",
      "HISTORY <> BP\n",
      "CVP <> TPR\n",
      "PCWP <> HRSAT\n",
      "HYPOVOLEMIA <> KINKEDTUBE\n",
      "HYPOVOLEMIA <> SHUNT\n",
      "HYPOVOLEMIA <> VENTLUNG\n",
      "LVEDVOLUME <> PULMEMBOLUS\n",
      "LVFAILURE <> MINVOLSET\n",
      "ERRLOWOUTPUT <> PAP\n",
      "ERRLOWOUTPUT <> VENTMACH\n",
      "HRBP <> BP\n",
      "HREKG <> CO\n",
      "HRSAT <> PRESS\n",
      "HRSAT <> CO\n",
      "KINKEDTUBE <> VENTTUBE\n",
      "PVSAT <> PAP\n",
      "PVSAT <> SHUNT\n",
      "PAP <> VENTMACH\n",
      "SHUNT <> MINVOLSET\n",
      "visit_to_asia -> tuberculosis\n",
      "tuberculosis -> either_turb_or_lung_cancer\n",
      "smoking -> lung_cancer\n",
      "smoking -> bronchitis\n",
      "lung_cancer -> either_turb_or_lung_cancer\n",
      "bronchitis -> dyspnoea\n",
      "either_turb_or_lung_cancer -> positive_xray\n",
      "either_turb_or_lung_cancer -> dyspnoea\n",
      "visit_to_asia => either_turb_or_lung_cancer\n",
      "visit_to_asia => positive_xray\n",
      "visit_to_asia => dyspnoea\n",
      "tuberculosis => positive_xray\n",
      "tuberculosis => dyspnoea\n",
      "smoking => either_turb_or_lung_cancer\n",
      "smoking => positive_xray\n",
      "smoking => dyspnoea\n",
      "lung_cancer => positive_xray\n",
      "lung_cancer => dyspnoea\n",
      "visit_to_asia <> smoking\n",
      "visit_to_asia <> lung_cancer\n",
      "visit_to_asia <> bronchitis\n",
      "tuberculosis <> smoking\n",
      "tuberculosis <> lung_cancer\n",
      "tuberculosis <> bronchitis\n",
      "lung_cancer <> bronchitis\n",
      "bronchitis <> either_turb_or_lung_cancer\n",
      "bronchitis <> positive_xray\n",
      "positive_xray <> dyspnoea\n",
      "Age -> DrivingSkill\n",
      "Age -> SeniorTrain\n",
      "SocioEcon -> RiskAversion\n",
      "SocioEcon -> VehicleYear\n",
      "SocioEcon -> MakeModel\n",
      "RiskAversion -> MakeModel\n",
      "RiskAversion -> DrivQuality\n",
      "RiskAversion -> SeniorTrain\n",
      "RiskAversion -> HomeBase\n",
      "VehicleYear -> RuggedAuto\n",
      "VehicleYear -> Airbag\n",
      "RuggedAuto -> ThisCarDam\n",
      "Accident -> ThisCarDam\n",
      "Accident -> ILiCost\n",
      "MakeModel -> Airbag\n",
      "ThisCarCost -> PropCost\n",
      "Theft -> ThisCarCost\n",
      "CarValue -> ThisCarCost\n",
      "HomeBase -> Theft\n",
      "AntiTheft -> Theft\n",
      "SocioEcon => MedCost\n",
      "RiskAversion => DrivingSkill\n",
      "VehicleYear => ThisCarDam\n",
      "VehicleYear => Accident\n",
      "VehicleYear => Cushioning\n",
      "MakeModel => Theft\n",
      "MakeModel => PropCost\n",
      "MakeModel => OtherCarCost\n",
      "DrivQuality => ThisCarDam\n",
      "Mileage => PropCost\n",
      "Antilock => MedCost\n",
      "DrivingSkill => ThisCarCost\n",
      "DrivingSkill => MedCost\n",
      "SeniorTrain => Accident\n",
      "SeniorTrain => DrivQuality\n",
      "SeniorTrain => ILiCost\n",
      "Theft => PropCost\n",
      "CarValue => PropCost\n",
      "HomeBase => ThisCarCost\n",
      "Airbag => MedCost\n",
      "GoodStudent <> Mileage\n",
      "Age <> Mileage\n",
      "VehicleYear <> HomeBase\n",
      "ThisCarDam <> CarValue\n",
      "ThisCarDam <> MedCost\n",
      "RuggedAuto <> DrivingSkill\n",
      "Accident <> Theft\n",
      "DrivQuality <> CarValue\n",
      "Mileage <> DrivingSkill\n",
      "Antilock <> Cushioning\n",
      "SeniorTrain <> AntiTheft\n",
      "ThisCarCost <> MedCost\n",
      "Theft <> Cushioning\n",
      "CarValue <> HomeBase\n",
      "CarValue <> MedCost\n",
      "HomeBase <> OtherCar\n",
      "HomeBase <> MedCost\n",
      "AntiTheft <> OtherCarCost\n",
      "OtherCarCost <> Airbag\n",
      "OtherCarCost <> ILiCost\n",
      "straaling_1 -> foto_1\n",
      "temp_1 -> mikro_1\n",
      "lai_1 -> foto_1\n",
      "lai_1 -> mikro_1\n",
      "meldug_1 -> lai_1\n",
      "meldug_2 -> meldug_3\n",
      "dm_3 -> dm_4\n",
      "temp_3 -> mikro_3\n",
      "lai_3 -> foto_3\n",
      "lai_3 -> lai_4\n",
      "lai_3 -> mikro_3\n",
      "meldug_3 -> meldug_4\n",
      "straaling_4 -> foto_4\n",
      "mikro_1 -> meldug_2\n",
      "middel_1 -> meldug_2\n",
      "mikro_2 -> meldug_3\n",
      "middel_2 -> meldug_3\n",
      "mikro_3 -> meldug_4\n",
      "nedboer_2 -> mikro_2\n",
      "nedboer_3 -> mikro_3\n",
      "dm_1 => dm_3\n",
      "straaling_1 => dm_1\n",
      "straaling_1 => dm_3\n",
      "temp_1 => dm_1\n",
      "temp_1 => lai_3\n",
      "lai_1 => dm_2\n",
      "meldug_1 => foto_1\n",
      "meldug_1 => meldug_4\n",
      "lai_0 => dm_1\n",
      "temp_2 => dm_2\n",
      "temp_2 => meldug_4\n",
      "lai_2 => dm_4\n",
      "temp_3 => udbytte\n",
      "meldug_4 => udbytte\n",
      "middel_1 => mikro_2\n",
      "middel_1 => udbytte\n",
      "nedboer_1 => foto_2\n",
      "nedboer_1 => meldug_3\n",
      "nedboer_2 => udbytte\n",
      "nedboer_3 => meldug_4\n",
      "dm_1 <> straaling_4\n",
      "dm_1 <> lai_4\n",
      "dm_1 <> mikro_2\n",
      "dm_1 <> nedboer_1\n",
      "foto_1 <> temp_4\n",
      "foto_1 <> mikro_3\n",
      "straaling_1 <> temp_3\n",
      "straaling_1 <> mikro_2\n",
      "straaling_1 <> middel_3\n",
      "temp_1 <> nedboer_2\n",
      "dm_2 <> straaling_3\n",
      "dm_2 <> nedboer_2\n",
      "foto_2 <> nedboer_3\n",
      "straaling_2 <> mikro_2\n",
      "meldug_2 <> nedboer_2\n",
      "meldug_2 <> nedboer_3\n",
      "temp_3 <> temp_4\n",
      "temp_4 <> nedboer_2\n",
      "mikro_2 <> nedboer_3\n",
      "middel_2 <> nedboer_3\n",
      "BirthAsphyxia -> Disease\n",
      "HypDistrib -> LowerBodyO2\n",
      "HypoxiaInO2 -> LowerBodyO2\n",
      "HypoxiaInO2 -> RUQO2\n",
      "CO2 -> CO2Report\n",
      "ChestXray -> XrayReport\n",
      "Grunting -> GruntingReport\n",
      "Disease -> Age\n",
      "Disease -> LVH\n",
      "Disease -> DuctFlow\n",
      "Disease -> LungParench\n",
      "Disease -> LungFlow\n",
      "LVH -> LVHreport\n",
      "CardiacMixing -> HypDistrib\n",
      "CardiacMixing -> HypoxiaInO2\n",
      "LungParench -> HypoxiaInO2\n",
      "LungParench -> CO2\n",
      "LungFlow -> ChestXray\n",
      "Sick -> Grunting\n",
      "Sick -> Age\n",
      "BirthAsphyxia => HypoxiaInO2\n",
      "BirthAsphyxia => Grunting\n",
      "BirthAsphyxia => CO2Report\n",
      "BirthAsphyxia => XrayReport\n",
      "BirthAsphyxia => GruntingReport\n",
      "BirthAsphyxia => Age\n",
      "BirthAsphyxia => LungParench\n",
      "BirthAsphyxia => LungFlow\n",
      "Disease => HypDistrib\n",
      "Disease => Grunting\n",
      "Disease => LowerBodyO2\n",
      "Disease => RUQO2\n",
      "Disease => XrayReport\n",
      "Disease => GruntingReport\n",
      "DuctFlow => LowerBodyO2\n",
      "LungParench => RUQO2\n",
      "LungParench => CO2Report\n",
      "LungParench => XrayReport\n",
      "LungFlow => XrayReport\n",
      "Sick => GruntingReport\n",
      "HypoxiaInO2 <> GruntingReport\n",
      "HypoxiaInO2 <> Sick\n",
      "CO2 <> XrayReport\n",
      "CO2 <> LungFlow\n",
      "ChestXray <> DuctFlow\n",
      "Grunting <> LVHreport\n",
      "Grunting <> Age\n",
      "LVHreport <> LowerBodyO2\n",
      "LVHreport <> CO2Report\n",
      "LVHreport <> XrayReport\n",
      "LVHreport <> LungFlow\n",
      "LowerBodyO2 <> CO2Report\n",
      "RUQO2 <> LVH\n",
      "RUQO2 <> LungFlow\n",
      "CO2Report <> CardiacMixing\n",
      "XrayReport <> LVH\n",
      "GruntingReport <> CardiacMixing\n",
      "LVH <> DuctFlow\n",
      "LVH <> CardiacMixing\n",
      "LungFlow <> Sick\n",
      "Pollution -> Cancer\n",
      "Smoker -> Cancer\n",
      "Cancer -> Xray\n",
      "Cancer -> Dyspnoea\n",
      "Pollution => Xray\n",
      "Pollution => Dyspnoea\n",
      "Smoker => Xray\n",
      "Smoker => Dyspnoea\n",
      "Pollution <> Smoker\n",
      "Xray <> Dyspnoea\n",
      "C_NI_12_00 -> C_NI_12_15\n",
      "CKNI_12_00 -> CKND_12_15\n",
      "CBODD_12_00 -> CBODN_12_15\n",
      "CKND_12_00 -> CKNN_12_15\n",
      "CNOD_12_00 -> CBODD_12_15\n",
      "CBODN_12_00 -> CNON_12_15\n",
      "C_NI_12_15 -> C_NI_12_30\n",
      "CKNI_12_15 -> CKND_12_30\n",
      "CKND_12_15 -> CKND_12_30\n",
      "CNOD_12_15 -> CNON_12_30\n",
      "CBODN_12_15 -> CNON_12_30\n",
      "CKNN_12_15 -> CKND_12_30\n",
      "C_NI_12_30 -> CBODD_12_45\n",
      "CBODD_12_30 -> CBODN_12_45\n",
      "CKND_12_30 -> CKND_12_45\n",
      "CKND_12_30 -> CKNN_12_45\n",
      "CNOD_12_30 -> CBODD_12_45\n",
      "CBODN_12_30 -> CNON_12_45\n",
      "CKNN_12_30 -> CKND_12_45\n",
      "CNON_12_30 -> CBODN_12_45\n",
      "C_NI_12_00 => CNOD_12_45\n",
      "CKNI_12_00 => CKNI_12_45\n",
      "CKNI_12_00 => CBODD_12_45\n",
      "CKNI_12_00 => CKND_12_45\n",
      "CBODD_12_00 => CNOD_12_30\n",
      "CBODD_12_00 => CBODN_12_45\n",
      "CBODN_12_00 => CBODD_12_45\n",
      "CBODN_12_00 => CNON_12_45\n",
      "CKNN_12_00 => CBODN_12_30\n",
      "CKNN_12_00 => CNOD_12_45\n",
      "CNON_12_00 => CBODD_12_30\n",
      "CNON_12_00 => CNON_12_30\n",
      "CNON_12_00 => CNOD_12_45\n",
      "C_NI_12_15 => C_NI_12_45\n",
      "C_NI_12_15 => CNOD_12_45\n",
      "CKNN_12_15 => CNOD_12_45\n",
      "CKNN_12_15 => CBODN_12_45\n",
      "CNON_12_15 => CBODD_12_45\n",
      "CNON_12_15 => CNOD_12_45\n",
      "CNON_12_15 => CBODN_12_45\n",
      "CBODD_12_00 <> CKNN_12_00\n",
      "CBODD_12_00 <> CKNI_12_15\n",
      "CBODD_12_00 <> CKNN_12_30\n",
      "CNOD_12_00 <> CKNN_12_00\n",
      "CNOD_12_00 <> CKNN_12_45\n",
      "CNON_12_00 <> CKNI_12_15\n",
      "CNOD_12_15 <> CKNI_12_30\n",
      "CBODN_12_15 <> CKNI_12_45\n",
      "CBODN_12_15 <> CKNN_12_45\n",
      "CKNN_12_15 <> C_NI_12_30\n",
      "CKNN_12_15 <> CNOD_12_30\n",
      "CNON_12_15 <> CKNN_12_45\n",
      "C_NI_12_30 <> CKNI_12_30\n",
      "C_NI_12_30 <> CBODN_12_30\n",
      "CBODD_12_30 <> CKNI_12_45\n",
      "CNON_12_30 <> CKNN_12_45\n",
      "CKNI_12_45 <> CBODD_12_45\n",
      "CKND_12_45 <> CNOD_12_45\n",
      "CKND_12_45 <> CBODN_12_45\n",
      "CNOD_12_45 <> CNON_12_45\n",
      "komm -> aar_mod\n",
      "forfrugt -> ngodnt\n",
      "jordn -> nprot\n",
      "pesticid -> nopt\n",
      "exptgens -> ngodnt\n",
      "exptgens -> nopt\n",
      "mod_nmin -> ngodnt\n",
      "nopt -> ngodnn\n",
      "saatid -> frspdag\n",
      "rokap -> dgv1059\n",
      "sort -> srtprot\n",
      "sort -> srtsize\n",
      "tkvs -> saakern\n",
      "partigerm -> markgrm\n",
      "frspdag -> jordinf\n",
      "jordinf -> markgrm\n",
      "keraks -> s2225\n",
      "aks_vgt -> ksort\n",
      "srtsize -> slt22\n",
      "ksort -> spndx\n",
      "jordtype => s2528\n",
      "komm => jordn\n",
      "komm => aks_m2\n",
      "nedbarea => ksort\n",
      "nmin => ngtilg\n",
      "aar_mod => ngtilg\n",
      "forfrugt => slt22\n",
      "pesticid => keraks\n",
      "pesticid => ksort\n",
      "exptgens => udb\n",
      "ngodn => s2528\n",
      "rokap => udb\n",
      "sort => ksort\n",
      "nplac => protein\n",
      "dg25 => keraks\n",
      "partigerm => udb\n",
      "partigerm => s2528\n",
      "frspdag => ksort\n",
      "jordinf => aks_vgt\n",
      "antplnt => ksort\n",
      "jordtype <> nedbarea\n",
      "nedbarea <> srtprot\n",
      "nmin <> saatid\n",
      "potnmin <> jordinf\n",
      "potnmin <> dgv5980\n",
      "jordn <> pesticid\n",
      "pesticid <> saakern\n",
      "exptgens <> dgv5980\n",
      "ngodnt <> rokap\n",
      "ngodnt <> bgbyg\n",
      "nopt <> antplnt\n",
      "ngodnn <> jordinf\n",
      "nprot <> saatid\n",
      "rokap <> markgrm\n",
      "dgv1059 <> saamng\n",
      "nplac <> partigerm\n",
      "sorttkv <> bgbyg\n",
      "udb <> tkv\n",
      "tkv <> bgbyg\n",
      "s2225 <> bgbyg\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import re\n",
    "\n",
    "sample_dir = \"pairwise_samples/\"\n",
    "gpt_dir = \"out/gpt_history/for_estimation/\"\n",
    "\n",
    "def pairwise(fp):\n",
    "    with open(fp, \"r\") as f:\n",
    "        lines = f.readlines()\n",
    "        for line in lines:\n",
    "            # parse v1,v2 as (v1,v2), v1 and v2 are strings\n",
    "            match = re.match(r\"(.*),(.*)\", line)\n",
    "            if match:\n",
    "                v1, v2 = match.group(1), match.group(2)\n",
    "                yield (v1, v2)\n",
    "\n",
    "## estimate \n",
    "datasets = [\"alarm\", \"asia\", \"insurance\", \"mildew\", \"child\", \"cancer\", \"water\", \"barley\"]\n",
    "pairwise_samples = {d:{\"edge\":[],\"indirect_path\":[],\"no_path_bi\":[]} for d in datasets}\n",
    "for d in datasets:\n",
    "    for v1, v2 in pairwise(f\"{sample_dir}/{d}/direct_connections_str.txt\"):\n",
    "        pairwise_samples[d][\"edge\"].append((v1, v2))\n",
    "    for v1, v2 in pairwise(f\"{sample_dir}/{d}/indirect_connections_str.txt\"):\n",
    "        pairwise_samples[d][\"indirect_path\"].append((v1, v2))\n",
    "    for v1, v2 in pairwise(f\"{sample_dir}/{d}/no_connection_str.txt\"):\n",
    "        pairwise_samples[d][\"no_path_bi\"].append((v1, v2))\n",
    "\n",
    "correct_num = {d:{\"edge\":0,\"indirect_path\":0,\"no_path_bi\":0} for d in datasets}\n",
    "reversed_num = {d:{\"edge\":0,\"indirect_path\":0,\"no_path_bi\":0} for d in datasets}\n",
    "\n",
    "for d in pairwise_samples:\n",
    "    gpt_file = f\"{gpt_dir}/{d}_history.json\"\n",
    "    json_history = json.load(open(gpt_file, \"r\"))\n",
    "    for v1, v2 in pairwise_samples[d][\"edge\"]:\n",
    "        print(f\"{v1} -> {v2}\")\n",
    "        # check if the element with \"start\":v1 and \"end\":v2 or \"start\":v2 and \"end\":v1 exists in the history;\n",
    "        flag = False\n",
    "        reverse_flag = False\n",
    "        for i, history in enumerate(json_history):\n",
    "            if history[\"start\"] == v1 and history[\"end\"] == v2:\n",
    "                flag = True\n",
    "                if history[\"answer\"] == \"A\":\n",
    "                    correct_num[d][\"edge\"] += 1\n",
    "                    reverse_flag = False\n",
    "                    break\n",
    "                if history[\"answer\"] == \"B\":\n",
    "                    reverse_flag = True\n",
    "\n",
    "            elif history[\"start\"] == v2 and history[\"end\"] == v1:\n",
    "                flag = True\n",
    "                if history[\"answer\"] == \"B\":\n",
    "                    correct_num[d][\"edge\"] += 1\n",
    "                    reverse_flag = False\n",
    "                    break\n",
    "                if history[\"answer\"] == \"A\":\n",
    "                    reverse_flag = True\n",
    "        if reverse_flag:\n",
    "            reversed_num[d][\"edge\"] += 1\n",
    "\n",
    "    for v1, v2 in pairwise_samples[d][\"indirect_path\"]:\n",
    "        print(f\"{v1} => {v2}\")\n",
    "        # check if the element with \"start\":v1 and \"end\":v2 or \"start\":v2 and \"end\":v1 exists in the history;\n",
    "        flag = False\n",
    "        reverse_flag = False\n",
    "        for i, history in enumerate(json_history):\n",
    "            if history[\"start\"] == v1 and history[\"end\"] == v2:\n",
    "                flag = True\n",
    "                if history[\"answer\"] == \"A\":\n",
    "                    correct_num[d][\"indirect_path\"] += 1\n",
    "                    reverse_flag = False\n",
    "                    break\n",
    "                if history[\"answer\"] == \"B\":\n",
    "                    reverse_flag = True\n",
    "\n",
    "            elif history[\"start\"] == v2 and history[\"end\"] == v1:\n",
    "                flag = True\n",
    "                if history[\"answer\"] == \"B\":\n",
    "                    correct_num[d][\"indirect_path\"] += 1\n",
    "                    reverse_flag = False\n",
    "                    break\n",
    "                if history[\"answer\"] == \"A\":\n",
    "                    reverse_flag = True\n",
    "        if reverse_flag:\n",
    "            reversed_num[d][\"indirect_path\"] += 1\n",
    "        # if no match query gpt4\n",
    "        if not flag:\n",
    "            input, output, answer = query_gpt4(d, v1, v2)\n",
    "            json_history.append({\"start\":v1, \"end\":v2, \"input\":input, \"output\":output, \"answer\":answer})\n",
    "            with open(gpt_file, \"w\") as f:\n",
    "                json.dump(json_history, f, indent=4)\n",
    "            if answer == \"A\":\n",
    "                correct_num[d][\"indirect_path\"] += 1\n",
    "            if answer == \"B\":\n",
    "                reversed_num[d][\"indirect_path\"] += 1\n",
    "        \n",
    "    for v1, v2 in pairwise_samples[d][\"no_path_bi\"]:\n",
    "        print(f\"{v1} <> {v2}\")\n",
    "        # check if the element with \"start\":v1 and \"end\":v2 or \"start\":v2 and \"end\":v1 exists in the history;\n",
    "        flag = False\n",
    "        for i, history in enumerate(json_history):\n",
    "            if history[\"start\"] == v1 and history[\"end\"] == v2:\n",
    "                flag = True\n",
    "                if history[\"answer\"] in [\"C\",\"D\"]:\n",
    "                    correct_num[d][\"no_path_bi\"] += 1       \n",
    "                    break\n",
    "            elif history[\"start\"] == v2 and history[\"end\"] == v1:\n",
    "                flag = True\n",
    "                if history[\"answer\"] in [\"C\",\"D\"]:\n",
    "                    correct_num[d][\"no_path_bi\"] += 1\n",
    "                    break\n",
    "        # if no match query gpt4\n",
    "        if not flag:\n",
    "            input, output, answer = query_gpt4(d, v1, v2)\n",
    "            json_history.append({\"start\":v1, \"end\":v2, \"input\":input, \"output\":output, \"answer\":answer})\n",
    "            with open(gpt_file, \"w\") as f:\n",
    "                json.dump(json_history, f, indent=4)\n",
    "            if answer in [\"C\",\"D\"]:\n",
    "                correct_num[d][\"no_path_bi\"] += 1\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'edge': 20, 'indirect_path': 13, 'no_path_bi': 12},\n",
       " 'asia': {'edge': 8, 'indirect_path': 10, 'no_path_bi': 8},\n",
       " 'insurance': {'edge': 17, 'indirect_path': 19, 'no_path_bi': 7},\n",
       " 'mildew': {'edge': 19, 'indirect_path': 20, 'no_path_bi': 2},\n",
       " 'child': {'edge': 20, 'indirect_path': 10, 'no_path_bi': 10},\n",
       " 'cancer': {'edge': 4, 'indirect_path': 4, 'no_path_bi': 0},\n",
       " 'water': {'edge': 19, 'indirect_path': 10, 'no_path_bi': 9},\n",
       " 'barley': {'edge': 14, 'indirect_path': 6, 'no_path_bi': 10}}"
      ]
     },
     "execution_count": 93,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "correct_num"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'edge': 0, 'indirect_path': 3, 'no_path_bi': 0},\n",
       " 'asia': {'edge': 0, 'indirect_path': 0, 'no_path_bi': 0},\n",
       " 'insurance': {'edge': 1, 'indirect_path': 1, 'no_path_bi': 0},\n",
       " 'mildew': {'edge': 1, 'indirect_path': 0, 'no_path_bi': 0},\n",
       " 'child': {'edge': 0, 'indirect_path': 8, 'no_path_bi': 0},\n",
       " 'cancer': {'edge': 0, 'indirect_path': 0, 'no_path_bi': 0},\n",
       " 'water': {'edge': 1, 'indirect_path': 10, 'no_path_bi': 0},\n",
       " 'barley': {'edge': 1, 'indirect_path': 6, 'no_path_bi': 0}}"
      ]
     },
     "execution_count": 94,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "reversed_num"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'edge': 1.0, 'indirect_path': 0.65, 'no_path_bi': 0.6},\n",
       " 'asia': {'edge': 1.0, 'indirect_path': 1.0, 'no_path_bi': 0.8},\n",
       " 'insurance': {'edge': 0.85, 'indirect_path': 0.95, 'no_path_bi': 0.35},\n",
       " 'mildew': {'edge': 0.95, 'indirect_path': 1.0, 'no_path_bi': 0.1},\n",
       " 'child': {'edge': 1.0, 'indirect_path': 0.5, 'no_path_bi': 0.5},\n",
       " 'cancer': {'edge': 1.0, 'indirect_path': 1.0, 'no_path_bi': 0.0},\n",
       " 'water': {'edge': 0.95, 'indirect_path': 0.5, 'no_path_bi': 0.45},\n",
       " 'barley': {'edge': 0.7, 'indirect_path': 0.3, 'no_path_bi': 0.5}}"
      ]
     },
     "execution_count": 95,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# calculate the accuraccy and save to a new dict\n",
    "accuracy = {d:{\"edge\":0,\"indirect_path\":0,\"no_path_bi\":0} for d in datasets}\n",
    "for d in datasets:\n",
    "    for k in pairwise_samples[d]:\n",
    "        accuracy[d][k] = correct_num[d][k] / len(pairwise_samples[d][k])\n",
    "accuracy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'edge': 0.0, 'indirect_path': 0.15, 'no_path_bi': 0.0},\n",
       " 'asia': {'edge': 0.0, 'indirect_path': 0.0, 'no_path_bi': 0.0},\n",
       " 'insurance': {'edge': 0.05, 'indirect_path': 0.05, 'no_path_bi': 0.0},\n",
       " 'mildew': {'edge': 0.05, 'indirect_path': 0.0, 'no_path_bi': 0.0},\n",
       " 'child': {'edge': 0.0, 'indirect_path': 0.4, 'no_path_bi': 0.0},\n",
       " 'cancer': {'edge': 0.0, 'indirect_path': 0.0, 'no_path_bi': 0.0},\n",
       " 'water': {'edge': 0.05, 'indirect_path': 0.5, 'no_path_bi': 0.0},\n",
       " 'barley': {'edge': 0.05, 'indirect_path': 0.3, 'no_path_bi': 0.0}}"
      ]
     },
     "execution_count": 96,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "acc_reversed = {d:{\"edge\":0,\"indirect_path\":0,\"no_path_bi\":0} for d in datasets}\n",
    "for d in datasets:\n",
    "    for k in pairwise_samples[d]:\n",
    "        acc_reversed[d][k] = reversed_num[d][k] / len(pairwise_samples[d][k])\n",
    "acc_reversed"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "true_dags = {}\n",
    "for d in datasets:\n",
    "    true_dags[d] = np.loadtxt(f\"BN_structure/{d}_graph.txt\", dtype=int)\n",
    "## calculate the edge number and the path number of the true DAGs\n",
    "\n",
    "edge_num = {d:0 for d in datasets}\n",
    "path_num = {d:0 for d in datasets}\n",
    "node_num = {d:0 for d in datasets}\n",
    "for d in datasets:\n",
    "    node_num[d] = len(true_dags[d])\n",
    "    edge_num[d] = np.sum(true_dags[d])\n",
    "    n = len(true_dags[d])\n",
    "    reachability = true_dags[d].copy()\n",
    "    for k in range(n):\n",
    "        for i in range(n):\n",
    "            for j in range(n):\n",
    "                reachability[i, j] = reachability[i, j] or (\n",
    "                    reachability[i, k] and reachability[k, j])\n",
    "    path_num[d] = np.sum(reachability)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [],
   "source": [
    "## add a new acc to the accuracy dict, which is the (edge_num * edge_acc + (path_num-edge_num) * path_acc) / path_num\n",
    "## do the same for reversed accuracy\n",
    "for d in datasets:\n",
    "    accuracy[d][\"path_acc\"] = (edge_num[d] * accuracy[d][\"edge\"] + (path_num[d] - edge_num[d]) * accuracy[d][\"indirect_path\"]) / path_num[d]\n",
    "    acc_reversed[d][\"path_acc\"] = (edge_num[d] * acc_reversed[d][\"edge\"] + (path_num[d] - edge_num[d]) * acc_reversed[d][\"indirect_path\"]) / path_num[d]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "metadata": {},
   "outputs": [],
   "source": [
    "# add a new column to pairwise_samples, 'path_acc', which equals 'indirectpath'\n",
    "for d in datasets:\n",
    "    pairwise_samples[d][\"path_acc\"] = pairwise_samples[d][\"indirect_path\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'edge': 0.9166666666666666,\n",
       " 'indirect_path': 0.6865671641791045,\n",
       " 'no_path_bi': 0.4393939393939394,\n",
       " 'path_acc': 0.7555929551986658}"
      ]
     },
     "execution_count": 100,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# calculate the weighted accuracy of edge, indirect_path, no_path_bi, repsectively, weighted by the number of samples in each dataset\\\n",
    "weighted_accuracy = {k:0 for k in pairwise_samples[datasets[0]]}\n",
    "for d in datasets:\n",
    "    for k in pairwise_samples[d]:\n",
    "        weighted_accuracy[k] += len(pairwise_samples[d][k]) * accuracy[d][k]\n",
    "for k in pairwise_samples[datasets[0]]:\n",
    "    weighted_accuracy[k] /= sum([len(pairwise_samples[d][k]) for d in datasets])\n",
    "weighted_accuracy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'edge': 0.030303030303030304,\n",
       " 'indirect_path': 0.208955223880597,\n",
       " 'no_path_bi': 0.0,\n",
       " 'path_acc': 0.15078649969766383}"
      ]
     },
     "execution_count": 101,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "weighted_reversed_accuracy = {k:0 for k in pairwise_samples[datasets[0]]}\n",
    "for d in datasets:\n",
    "    for k in pairwise_samples[d]:\n",
    "        weighted_reversed_accuracy[k] += len(pairwise_samples[d][k]) * acc_reversed[d][k]\n",
    "for k in pairwise_samples[datasets[0]]:\n",
    "    weighted_reversed_accuracy[k] /= sum([len(pairwise_samples[d][k]) for d in datasets])\n",
    "weighted_reversed_accuracy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "p_e: 0.5606060606060606, p_r: 0.15078649969766383, p_r_d: 0.030303030303030304, p_m_d: 0.053030303030303066, p_c: 0.7555929551986658\n"
     ]
    }
   ],
   "source": [
    "## LLM related parameters\n",
    "edge_acc = weighted_accuracy[\"edge\"]\n",
    "ind_acc = weighted_accuracy[\"indirect_path\"]\n",
    "no_acc = weighted_accuracy[\"no_path_bi\"]\n",
    "path_acc = weighted_accuracy[\"path_acc\"]\n",
    "edge_rev = weighted_reversed_accuracy[\"edge\"]\n",
    "ind_rev = weighted_reversed_accuracy[\"indirect_path\"]\n",
    "path_rev = weighted_reversed_accuracy[\"path_acc\"]\n",
    "\n",
    "p_e = 1 - no_acc\n",
    "p_r = path_rev\n",
    "p_r_d = edge_rev\n",
    "p_m_d = 1 - edge_acc - edge_rev\n",
    "p_c = path_acc\n",
    "print(f\"p_e: {p_e}, p_r: {p_r}, p_r_d: {p_r_d}, p_m_d: {p_m_d}, p_c: {p_c}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "gamma_1: 0.5128619140036711\n"
     ]
    }
   ],
   "source": [
    "# structural related parameters\n",
    "gamma_1_dict = {}\n",
    "for d in datasets:\n",
    "    n, e, p = node_num[d], edge_num[d], path_num[d]\n",
    "    cn2 = n*(n-1) / 2\n",
    "    gamma_1_dict[d] = (cn2 - p) / cn2\n",
    "gamma_1 = np.mean(list(gamma_1_dict.values()))\n",
    "print(f\"gamma_1: {gamma_1}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 131,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "gamma_2: 1.0875914698180322, z_1: 0.8763823919470554, z_2: 0.050014626639769875, pre: 0.05576574731711764\n"
     ]
    }
   ],
   "source": [
    "# CSL related parameters\n",
    "gamma_2_dict = {}\n",
    "z_1_dict = {}\n",
    "z_2_dict = {}\n",
    "pre_dict = {} \n",
    "sizes = [{\"asia\": 250, \"child\": 500, \"insurance\": 500, \"alarm\": 1000, \"cancer\": 250, \"mildew\": 8000, \"water\": 1000, \"barley\": 2000},\n",
    "                             {\"asia\": 1000, \"child\": 2000, \"insurance\": 2000, \"alarm\": 4000, \"cancer\": 1000, \"mildew\": 32000, \"water\": 4000, \"barley\": 8000}]\n",
    "for d in datasets:\n",
    "    true_dag = true_dags[d]\n",
    "    n = true_dag.shape[0]\n",
    "    reachability = true_dags[d].copy()\n",
    "    for k in range(n):\n",
    "        for i in range(n):\n",
    "            for j in range(n):\n",
    "                reachability[i, j] = reachability[i, j] or (\n",
    "                    reachability[i, k] and reachability[k, j])\n",
    "    z_1_dict[d] = {sizes[0][d]:[], sizes[1][d]:[]}\n",
    "    z_2_dict[d] = {sizes[0][d]:[], sizes[1][d]:[]}\n",
    "    gamma_2_dict[d] = {sizes[0][d]:[], sizes[1][d]:[]}\n",
    "    pre_dict[d] = {sizes[0][d]:[], sizes[1][d]:[]}\n",
    "    for s in range(2):\n",
    "        for r in range(6):\n",
    "            fp = f\"out/adj-matrix/{d}-{sizes[s][d]}-{r+1}-MINOBSx-bdeu-iter1.txt\"\n",
    "            ev_dag = np.loadtxt(fp, dtype=int)\n",
    "            gamma_2_dict[d][sizes[s][d]].append(np.sum(ev_dag) / true_dag.shape[0])\n",
    "            if np.sum(ev_dag) == 0:\n",
    "                continue\n",
    "            # z_1 is the ratio of correct edges\n",
    "            z_1_dict[d][sizes[s][d]].append(np.sum(ev_dag * true_dag) / np.sum(ev_dag))\n",
    "            # z_2 is the ratio of reversed edges\n",
    "            z_2_dict[d][sizes[s][d]].append(np.sum(ev_dag * true_dag.T) / np.sum(ev_dag))\n",
    "            # pre is the probability of rechatbility[v1,v2] = 1 given the condition that ev_dag[v2,v1] = 1\n",
    "            pre_dict[d][sizes[s][d]].append(np.sum(reachability * ev_dag.T) / np.sum(ev_dag.T))\n",
    "gamma_2 = np.mean([np.mean(gamma_2_dict[d][sizes[0][d]]) for d in datasets] + [np.mean(gamma_2_dict[d][sizes[1][d]]) for d in datasets])\n",
    "z_1 = np.mean([np.mean(z_1_dict[d][sizes[0][d]]) for d in datasets] + [np.mean(z_1_dict[d][sizes[1][d]]) for d in datasets])\n",
    "z_2 = np.mean([np.mean(z_2_dict[d][sizes[0][d]]) for d in datasets] + [np.mean(z_2_dict[d][sizes[1][d]]) for d in datasets])\n",
    "pre = np.mean([np.mean(pre_dict[d][sizes[0][d]]) for d in datasets] + [np.mean(pre_dict[d][sizes[1][d]]) for d in datasets])\n",
    "print(f\"gamma_2: {gamma_2}, z_1: {z_1}, z_2: {z_2}, pre: {pre}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 132,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.3609673441012883"
      ]
     },
     "execution_count": 132,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "p_e*gamma_1 + p_r*(1-gamma_1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 133,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.09775690104112862"
      ]
     },
     "execution_count": 133,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "((p_r_d+p_m_d)*z_1 + p_m_d*z_2 + (p_r + p_c*pre)*(1-z_1-z_2))*gamma_2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "1.8462499335439286"
      ]
     },
     "execution_count": 135,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ours = 0.09775690104112862\n",
    "full = 0.3609673441012883\n",
    "1 /(2*ours / full)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 137,
   "metadata": {},
   "outputs": [],
   "source": [
    "save_dict = {\"llm_sample\":pairwise_samples,\"llm_acc\":accuracy, \"llm_reversed\":acc_reversed,\"gamma1\":gamma_1_dict,\"gamma_2\":gamma_2_dict,\"z_1\":z_1_dict,\"z_2\":z_2_dict,\"pre\":pre_dict}\n",
    "json.dump(save_dict, open(\"out/llm_estimation.json\", \"w\"), indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "para_record = json.load(open(\"out/llm_estimation.json\", \"r\"))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_keys(['llm_sample', 'llm_acc', 'llm_reversed', 'gamma1', 'gamma_2', 'z_1', 'z_2', 'pre'])"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "para_record.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>alarm</th>\n",
       "      <th>asia</th>\n",
       "      <th>insurance</th>\n",
       "      <th>mildew</th>\n",
       "      <th>child</th>\n",
       "      <th>cancer</th>\n",
       "      <th>water</th>\n",
       "      <th>barley</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>edge</th>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.850000</td>\n",
       "      <td>0.950000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.950000</td>\n",
       "      <td>0.700000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>indirect_path</th>\n",
       "      <td>0.650000</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.950000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.300000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>no_path_bi</th>\n",
       "      <td>0.600000</td>\n",
       "      <td>0.8</td>\n",
       "      <td>0.350000</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.450000</td>\n",
       "      <td>0.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>path_acc</th>\n",
       "      <td>0.722197</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.919048</td>\n",
       "      <td>0.991901</td>\n",
       "      <td>0.695312</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.671676</td>\n",
       "      <td>0.362338</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  alarm  asia  insurance    mildew     child  cancer  \\\n",
       "edge           1.000000   1.0   0.850000  0.950000  1.000000     1.0   \n",
       "indirect_path  0.650000   1.0   0.950000  1.000000  0.500000     1.0   \n",
       "no_path_bi     0.600000   0.8   0.350000  0.100000  0.500000     0.0   \n",
       "path_acc       0.722197   1.0   0.919048  0.991901  0.695312     1.0   \n",
       "\n",
       "                  water    barley  \n",
       "edge           0.950000  0.700000  \n",
       "indirect_path  0.500000  0.300000  \n",
       "no_path_bi     0.450000  0.500000  \n",
       "path_acc       0.671676  0.362338  "
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "para_record['llm_acc']\n",
    "import pandas as pd\n",
    "\n",
    "llm_acc = pd.DataFrame(para_record['llm_acc'])\n",
    "llm_acc"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>alarm</th>\n",
       "      <th>asia</th>\n",
       "      <th>insurance</th>\n",
       "      <th>mildew</th>\n",
       "      <th>child</th>\n",
       "      <th>cancer</th>\n",
       "      <th>water</th>\n",
       "      <th>barley</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>edge</th>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.05</td>\n",
       "      <td>0.050000</td>\n",
       "      <td>0.00000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.050000</td>\n",
       "      <td>0.050000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>indirect_path</th>\n",
       "      <td>0.150000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.05</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.40000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.300000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>no_path_bi</th>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.00000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>path_acc</th>\n",
       "      <td>0.119058</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.05</td>\n",
       "      <td>0.008099</td>\n",
       "      <td>0.24375</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.328324</td>\n",
       "      <td>0.261039</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  alarm  asia  insurance    mildew    child  cancer     water  \\\n",
       "edge           0.000000   0.0       0.05  0.050000  0.00000     0.0  0.050000   \n",
       "indirect_path  0.150000   0.0       0.05  0.000000  0.40000     0.0  0.500000   \n",
       "no_path_bi     0.000000   0.0       0.00  0.000000  0.00000     0.0  0.000000   \n",
       "path_acc       0.119058   0.0       0.05  0.008099  0.24375     0.0  0.328324   \n",
       "\n",
       "                 barley  \n",
       "edge           0.050000  \n",
       "indirect_path  0.300000  \n",
       "no_path_bi     0.000000  \n",
       "path_acc       0.261039  "
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "llm_reversed = pd.DataFrame(para_record[\"llm_reversed\"])\n",
    "llm_reversed"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'edge': 20, 'indirect_path': 20, 'no_path_bi': 20, 'path_acc': 20},\n",
       " 'asia': {'edge': 8, 'indirect_path': 10, 'no_path_bi': 10, 'path_acc': 10},\n",
       " 'insurance': {'edge': 20,\n",
       "  'indirect_path': 20,\n",
       "  'no_path_bi': 20,\n",
       "  'path_acc': 20},\n",
       " 'mildew': {'edge': 20, 'indirect_path': 20, 'no_path_bi': 20, 'path_acc': 20},\n",
       " 'child': {'edge': 20, 'indirect_path': 20, 'no_path_bi': 20, 'path_acc': 20},\n",
       " 'cancer': {'edge': 4, 'indirect_path': 4, 'no_path_bi': 2, 'path_acc': 4},\n",
       " 'water': {'edge': 20, 'indirect_path': 20, 'no_path_bi': 20, 'path_acc': 20},\n",
       " 'barley': {'edge': 20, 'indirect_path': 20, 'no_path_bi': 20, 'path_acc': 20}}"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "llm_sample = para_record[\"llm_sample\"]\n",
    "for d in llm_sample:\n",
    "    for s in llm_sample[d]:\n",
    "        llm_sample[d][s] = len(llm_sample[d][s])\n",
    "llm_sample"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_values([1.2162162162162165, 1.0104166666666667, 1.4351851851851851, 0.7904761904761904, 1.0916666666666666, 0.5500000000000002, 1.3411458333333333, 1.265625])"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "g2 = para_record[\"gamma_2\"]\n",
    "g2_avg = {}\n",
    "for d in g2:\n",
    "    t = 0\n",
    "    for s in g2[d]:\n",
    "        t += sum(g2[d][s])\n",
    "    g2_avg[d] = t / (2*len(g2[d][s]))\n",
    "g2_avg.values()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_values([0.9578342397144431, 0.8773148148148149, 0.9074871522028775, 0.8691919191919192, 0.9806998556998557, 0.9027777777777778, 0.6679817023732718, 0.8374181384479472])"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "z1 = para_record[\"z_1\"]\n",
    "z1_avg = {}\n",
    "for d in z1:\n",
    "    t = 0\n",
    "    num = 0\n",
    "    for s in z1[d]:\n",
    "        \n",
    "        t += sum(z1[d][s])\n",
    "        num += len(z1[d][s])\n",
    "    z1_avg[d] = t / num\n",
    "z1_avg.values()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_values([0.9578342397144431, 0.8773148148148149, 0.9074871522028775, 0.8691919191919192, 0.9806998556998557, 0.9027777777777778, 0.6679817023732718, 0.8374181384479472])"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "z2 = para_record[\"z_2\"]\n",
    "z2_avg = {}\n",
    "for d in z2:\n",
    "    t = 0\n",
    "    num = 0\n",
    "    for s in z2[d]:\n",
    "        \n",
    "        t += sum(z2[d][s])\n",
    "        num += len(z2[d][s])\n",
    "    z2_avg[d] = t / num\n",
    "z2_avg.values()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_values([0.6651651651651652, 0.35714285714285715, 0.5213675213675214, 0.5226890756302521, 0.6631578947368421, 0.2, 0.6512096774193549, 0.5221631205673759])"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "para_record[\"gamma1\"].values()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import json\n",
    "\n",
    "datasets = [\"alarm\", \"asia\", \"insurance\", \"mildew\", \"child\", \"cancer\", \"water\", \"barley\"]\n",
    "gpt_dir = \"out/gpt_history/for_estimation/\"\n",
    "\n",
    "answer_type_dict = {d:{k:{\"direct_edges\":[],\"reversed_edges\":[],\"indirect_paths\":[],\"reversed_indirect_paths\":[],\"no_connections\":[], \"common_parents\":[], \"common_childs\":[]} for k in [\"A\",\"B\",\"C\"]} for d in datasets}\n",
    "for d in datasets:\n",
    "    mapping = np.loadtxt(f\"BN_structure/mappings/{d}.mapping\", dtype=str)\n",
    "    true_dag = np.loadtxt(f\"BN_structure/{d}_graph.txt\", dtype=int)\n",
    "    n = true_dag.shape[0]\n",
    "    reachability = true_dag.copy()\n",
    "    for k in range(n):\n",
    "        for i in range(n):\n",
    "            for j in range(n):\n",
    "                reachability[i, j] = reachability[i, j] or (\n",
    "                    reachability[i, k] and reachability[k, j])\n",
    "    gpt_file = f\"{gpt_dir}/{d}_history.json\"\n",
    "    json_history = json.load(open(gpt_file, \"r\"))\n",
    "    for i, history in enumerate(json_history):\n",
    "        start = history[\"start\"]\n",
    "        end = history[\"end\"]\n",
    "        if history[\"answer\"] not in [\"A\",\"B\",\"C\"]:\n",
    "            continue\n",
    "        modif_dict = answer_type_dict[d][history[\"answer\"]]\n",
    "        # mapping[i] = start, mapping[j] = end, check true_dag[i][j] and true_dag[j][i]\n",
    "        i = np.where(mapping == start)[0][0]\n",
    "        j = np.where(mapping == end)[0][0]\n",
    "        if true_dag[i][j] == 1:\n",
    "            modif_dict[\"direct_edges\"].append((start, end))\n",
    "        elif true_dag[j][i] == 1:\n",
    "            modif_dict[\"reversed_edges\"].append((start, end))\n",
    "        elif reachability[i][j] == 1:\n",
    "            modif_dict[\"indirect_paths\"].append((start, end))\n",
    "        elif reachability[j][i] == 1:\n",
    "            modif_dict[\"reversed_indirect_paths\"].append((start, end))\n",
    "        else:\n",
    "            modif_dict[\"no_connections\"].append((start, end))\n",
    "            if np.sum(true_dag[i].T * true_dag[j].T) > 0:\n",
    "                modif_dict[\"common_childs\"].append((start, end))\n",
    "            elif np.sum(true_dag[i] * true_dag[j]) > 0:\n",
    "                modif_dict[\"common_parents\"].append((start, end))\n",
    "            \n",
    "        \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'A': {'direct_edges': [('HYPOVOLEMIA', 'LVEDVOLUME'),\n",
       "    ('HYPOVOLEMIA', 'STROKEVOLUME'),\n",
       "    ('LVEDVOLUME', 'CVP'),\n",
       "    ('LVEDVOLUME', 'PCWP'),\n",
       "    ('LVFAILURE', 'LVEDVOLUME'),\n",
       "    ('LVFAILURE', 'STROKEVOLUME'),\n",
       "    ('STROKEVOLUME', 'CO'),\n",
       "    ('ERRLOWOUTPUT', 'HRBP'),\n",
       "    ('ERRCAUTER', 'HREKG'),\n",
       "    ('ERRCAUTER', 'HRSAT'),\n",
       "    ('TPR', 'CATECHOL'),\n",
       "    ('TPR', 'BP'),\n",
       "    ('KINKEDTUBE', 'PRESS'),\n",
       "    ('KINKEDTUBE', 'VENTLUNG'),\n",
       "    ('FIO2', 'PVSAT'),\n",
       "    ('PVSAT', 'SAO2'),\n",
       "    ('PULMEMBOLUS', 'PAP'),\n",
       "    ('PULMEMBOLUS', 'SHUNT'),\n",
       "    ('SHUNT', 'SAO2'),\n",
       "    ('INTUBATION', 'MINVOL'),\n",
       "    ('INTUBATION', 'SHUNT'),\n",
       "    ('INTUBATION', 'PRESS'),\n",
       "    ('INTUBATION', 'VENTLUNG'),\n",
       "    ('INTUBATION', 'VENTALV'),\n",
       "    ('DISCONNECT', 'VENTTUBE'),\n",
       "    ('VENTMACH', 'VENTTUBE'),\n",
       "    ('VENTTUBE', 'PRESS'),\n",
       "    ('VENTTUBE', 'VENTLUNG'),\n",
       "    ('VENTLUNG', 'EXPCO2'),\n",
       "    ('VENTLUNG', 'MINVOL'),\n",
       "    ('VENTALV', 'PVSAT'),\n",
       "    ('VENTALV', 'ARTCO2'),\n",
       "    ('ARTCO2', 'EXPCO2'),\n",
       "    ('CATECHOL', 'HR'),\n",
       "    ('HR', 'HREKG'),\n",
       "    ('HR', 'CO'),\n",
       "    ('CO', 'BP'),\n",
       "    ('LVFAILURE', 'HISTORY'),\n",
       "    ('ANAPHYLAXIS', 'TPR'),\n",
       "    ('VENTLUNG', 'VENTALV'),\n",
       "    ('ARTCO2', 'CATECHOL'),\n",
       "    ('MINVOLSET', 'VENTMACH'),\n",
       "    ('INSUFFANESTH', 'CATECHOL'),\n",
       "    ('SAO2', 'CATECHOL')],\n",
       "   'reversed_edges': [('CATECHOL', 'TPR'), ('HRBP', 'ERRLOWOUTPUT')],\n",
       "   'indirect_paths': [('KINKEDTUBE', 'HR'),\n",
       "    ('VENTALV', 'SAO2'),\n",
       "    ('VENTALV', 'CATECHOL'),\n",
       "    ('FIO2', 'SAO2'),\n",
       "    ('PULMEMBOLUS', 'SAO2'),\n",
       "    ('MINVOLSET', 'VENTTUBE'),\n",
       "    ('LVFAILURE', 'PCWP'),\n",
       "    ('PULMEMBOLUS', 'HRBP'),\n",
       "    ('PULMEMBOLUS', 'HREKG'),\n",
       "    ('ANAPHYLAXIS', 'HREKG'),\n",
       "    ('PVSAT', 'HREKG'),\n",
       "    ('PVSAT', 'HRSAT'),\n",
       "    ('KINKEDTUBE', 'VENTALV'),\n",
       "    ('PVSAT', 'CATECHOL'),\n",
       "    ('SAO2', 'HRSAT'),\n",
       "    ('KINKEDTUBE', 'SAO2'),\n",
       "    ('LVFAILURE', 'CVP'),\n",
       "    ('KINKEDTUBE', 'HRBP'),\n",
       "    ('SAO2', 'HRBP'),\n",
       "    ('ARTCO2', 'HRSAT'),\n",
       "    ('VENTTUBE', 'MINVOL'),\n",
       "    ('ARTCO2', 'HRBP'),\n",
       "    ('ARTCO2', 'HREKG'),\n",
       "    ('VENTTUBE', 'VENTALV'),\n",
       "    ('KINKEDTUBE', 'MINVOL'),\n",
       "    ('LVFAILURE', 'CO'),\n",
       "    ('KINKEDTUBE', 'ARTCO2'),\n",
       "    ('VENTTUBE', 'ARTCO2'),\n",
       "    ('VENTALV', 'EXPCO2'),\n",
       "    ('SHUNT', 'HREKG'),\n",
       "    ('INTUBATION', 'HREKG'),\n",
       "    ('INTUBATION', 'PVSAT'),\n",
       "    ('DISCONNECT', 'HR'),\n",
       "    ('MINVOLSET', 'PVSAT'),\n",
       "    ('VENTMACH', 'HRBP'),\n",
       "    ('VENTTUBE', 'CO'),\n",
       "    ('HYPOVOLEMIA', 'PCWP')],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [('SHUNT', 'PVSAT'),\n",
       "    ('FIO2', 'VENTLUNG'),\n",
       "    ('PULMEMBOLUS', 'PVSAT'),\n",
       "    ('SHUNT', 'MINVOL'),\n",
       "    ('SHUNT', 'VENTLUNG'),\n",
       "    ('SHUNT', 'VENTALV'),\n",
       "    ('INTUBATION', 'VENTTUBE'),\n",
       "    ('DISCONNECT', 'VENTMACH'),\n",
       "    ('VENTALV', 'MINVOL'),\n",
       "    ('SHUNT', 'PAP'),\n",
       "    ('KINKEDTUBE', 'VENTTUBE'),\n",
       "    ('LVFAILURE', 'HRBP'),\n",
       "    ('ERRCAUTER', 'CATECHOL'),\n",
       "    ('ANAPHYLAXIS', 'FIO2'),\n",
       "    ('FIO2', 'PAP'),\n",
       "    ('HYPOVOLEMIA', 'CATECHOL'),\n",
       "    ('PULMEMBOLUS', 'FIO2'),\n",
       "    ('ANAPHYLAXIS', 'CVP'),\n",
       "    ('ANAPHYLAXIS', 'EXPCO2'),\n",
       "    ('MINVOL', 'PVSAT'),\n",
       "    ('MINVOL', 'EXPCO2'),\n",
       "    ('SHUNT', 'EXPCO2'),\n",
       "    ('PRESS', 'PVSAT'),\n",
       "    ('CATECHOL', 'MINVOL'),\n",
       "    ('ERRCAUTER', 'HRBP'),\n",
       "    ('HRSAT', 'HRBP'),\n",
       "    ('ANAPHYLAXIS', 'LVEDVOLUME'),\n",
       "    ('PRESS', 'MINVOL'),\n",
       "    ('HYPOVOLEMIA', 'PAP'),\n",
       "    ('ARTCO2', 'TPR'),\n",
       "    ('LVFAILURE', 'TPR'),\n",
       "    ('PAP', 'HISTORY'),\n",
       "    ('PVSAT', 'TPR'),\n",
       "    ('CATECHOL', 'LVFAILURE'),\n",
       "    ('ERRCAUTER', 'HR'),\n",
       "    ('LVEDVOLUME', 'STROKEVOLUME'),\n",
       "    ('ERRLOWOUTPUT', 'HR'),\n",
       "    ('PCWP', 'HISTORY'),\n",
       "    ('VENTMACH', 'KINKEDTUBE'),\n",
       "    ('HYPOVOLEMIA', 'ERRLOWOUTPUT'),\n",
       "    ('CATECHOL', 'PCWP'),\n",
       "    ('LVEDVOLUME', 'CO'),\n",
       "    ('STROKEVOLUME', 'PCWP'),\n",
       "    ('CO', 'HISTORY'),\n",
       "    ('SAO2', 'HISTORY'),\n",
       "    ('PVSAT', 'LVFAILURE'),\n",
       "    ('HYPOVOLEMIA', 'VENTLUNG'),\n",
       "    ('LVEDVOLUME', 'PULMEMBOLUS'),\n",
       "    ('HREKG', 'CO')],\n",
       "   'common_parents': [('SHUNT', 'PVSAT'),\n",
       "    ('INTUBATION', 'VENTTUBE'),\n",
       "    ('DISCONNECT', 'VENTMACH'),\n",
       "    ('KINKEDTUBE', 'VENTTUBE'),\n",
       "    ('ARTCO2', 'TPR'),\n",
       "    ('ERRCAUTER', 'HR'),\n",
       "    ('ERRLOWOUTPUT', 'HR')],\n",
       "   'common_childs': [('SHUNT', 'PVSAT'),\n",
       "    ('INTUBATION', 'VENTTUBE'),\n",
       "    ('DISCONNECT', 'VENTMACH'),\n",
       "    ('KINKEDTUBE', 'VENTTUBE'),\n",
       "    ('ARTCO2', 'TPR'),\n",
       "    ('ERRCAUTER', 'HR'),\n",
       "    ('ERRLOWOUTPUT', 'HR')]},\n",
       "  'B': {'direct_edges': [('MINVOLSET', 'VENTMACH')],\n",
       "   'reversed_edges': [('HISTORY', 'LVFAILURE'),\n",
       "    ('TPR', 'ANAPHYLAXIS'),\n",
       "    ('LVEDVOLUME', 'HYPOVOLEMIA'),\n",
       "    ('LVEDVOLUME', 'LVFAILURE'),\n",
       "    ('PVSAT', 'FIO2'),\n",
       "    ('SAO2', 'PVSAT'),\n",
       "    ('MINVOL', 'INTUBATION'),\n",
       "    ('PVSAT', 'VENTALV'),\n",
       "    ('SAO2', 'SHUNT'),\n",
       "    ('VENTTUBE', 'DISCONNECT'),\n",
       "    ('VENTTUBE', 'VENTMACH'),\n",
       "    ('VENTLUNG', 'INTUBATION'),\n",
       "    ('VENTALV', 'INTUBATION'),\n",
       "    ('VENTALV', 'VENTLUNG'),\n",
       "    ('PAP', 'PULMEMBOLUS'),\n",
       "    ('SHUNT', 'INTUBATION'),\n",
       "    ('STROKEVOLUME', 'HYPOVOLEMIA'),\n",
       "    ('SHUNT', 'PULMEMBOLUS'),\n",
       "    ('PCWP', 'LVEDVOLUME'),\n",
       "    ('STROKEVOLUME', 'LVFAILURE'),\n",
       "    ('PRESS', 'KINKEDTUBE'),\n",
       "    ('HREKG', 'ERRCAUTER')],\n",
       "   'indirect_paths': [('ANAPHYLAXIS', 'BP'),\n",
       "    ('PULMEMBOLUS', 'CO'),\n",
       "    ('DISCONNECT', 'HRBP'),\n",
       "    ('ANAPHYLAXIS', 'BP'),\n",
       "    ('PULMEMBOLUS', 'CO'),\n",
       "    ('DISCONNECT', 'HRBP')],\n",
       "   'reversed_indirect_paths': [('SAO2', 'PULMEMBOLUS'),\n",
       "    ('PCWP', 'LVFAILURE'),\n",
       "    ('HRBP', 'PULMEMBOLUS'),\n",
       "    ('VENTALV', 'KINKEDTUBE'),\n",
       "    ('HRSAT', 'PVSAT'),\n",
       "    ('SAO2', 'KINKEDTUBE'),\n",
       "    ('HRBP', 'SAO2'),\n",
       "    ('PVSAT', 'KINKEDTUBE'),\n",
       "    ('HR', 'PULMEMBOLUS'),\n",
       "    ('CATECHOL', 'ANAPHYLAXIS'),\n",
       "    ('ARTCO2', 'VENTLUNG')],\n",
       "   'no_connections': [('PVSAT', 'PULMEMBOLUS'),\n",
       "    ('VENTLUNG', 'FIO2'),\n",
       "    ('PVSAT', 'SHUNT'),\n",
       "    ('PAP', 'SHUNT'),\n",
       "    ('FIO2', 'PULMEMBOLUS'),\n",
       "    ('CATECHOL', 'HYPOVOLEMIA'),\n",
       "    ('EXPCO2', 'MINVOL'),\n",
       "    ('EXPCO2', 'SHUNT'),\n",
       "    ('PCWP', 'CVP'),\n",
       "    ('HREKG', 'HRSAT'),\n",
       "    ('PVSAT', 'MINVOL'),\n",
       "    ('ERRLOWOUTPUT', 'HRSAT'),\n",
       "    ('PAP', 'HYPOVOLEMIA'),\n",
       "    ('ARTCO2', 'FIO2'),\n",
       "    ('VENTALV', 'FIO2'),\n",
       "    ('HYPOVOLEMIA', 'SHUNT'),\n",
       "    ('ERRLOWOUTPUT', 'PAP'),\n",
       "    ('PVSAT', 'PAP'),\n",
       "    ('PVSAT', 'SHUNT'),\n",
       "    ('PAP', 'VENTMACH'),\n",
       "    ('SHUNT', 'MINVOLSET')],\n",
       "   'common_parents': [('PVSAT', 'SHUNT'),\n",
       "    ('VENTALV', 'FIO2'),\n",
       "    ('PVSAT', 'SHUNT')],\n",
       "   'common_childs': [('PVSAT', 'SHUNT'),\n",
       "    ('VENTALV', 'FIO2'),\n",
       "    ('PVSAT', 'SHUNT')]},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [('VENTTUBE', 'MINVOLSET'),\n",
       "    ('BP', 'PULMEMBOLUS'),\n",
       "    ('CATECHOL', 'PULMEMBOLUS')],\n",
       "   'no_connections': [('ANAPHYLAXIS', 'ERRLOWOUTPUT'),\n",
       "    ('FIO2', 'LVFAILURE'),\n",
       "    ('LVFAILURE', 'FIO2'),\n",
       "    ('LVFAILURE', 'HYPOVOLEMIA'),\n",
       "    ('DISCONNECT', 'MINVOLSET'),\n",
       "    ('VENTALV', 'SHUNT'),\n",
       "    ('INTUBATION', 'MINVOLSET'),\n",
       "    ('MINVOLSET', 'DISCONNECT'),\n",
       "    ('VENTTUBE', 'KINKEDTUBE'),\n",
       "    ('PULMEMBOLUS', 'INTUBATION'),\n",
       "    ('ERRCAUTER', 'PULMEMBOLUS'),\n",
       "    ('DISCONNECT', 'PULMEMBOLUS'),\n",
       "    ('VENTMACH', 'DISCONNECT'),\n",
       "    ('LVFAILURE', 'ANAPHYLAXIS'),\n",
       "    ('ANAPHYLAXIS', 'ERRCAUTER'),\n",
       "    ('KINKEDTUBE', 'HISTORY'),\n",
       "    ('PULMEMBOLUS', 'HISTORY'),\n",
       "    ('PULMEMBOLUS', 'ERRLOWOUTPUT'),\n",
       "    ('PULMEMBOLUS', 'ANAPHYLAXIS'),\n",
       "    ('DISCONNECT', 'KINKEDTUBE'),\n",
       "    ('ERRCAUTER', 'ANAPHYLAXIS'),\n",
       "    ('INTUBATION', 'ANAPHYLAXIS'),\n",
       "    ('HISTORY', 'ANAPHYLAXIS'),\n",
       "    ('ANAPHYLAXIS', 'INTUBATION'),\n",
       "    ('HISTORY', 'SHUNT'),\n",
       "    ('HYPOVOLEMIA', 'HISTORY'),\n",
       "    ('LVFAILURE', 'INSUFFANESTH'),\n",
       "    ('LVFAILURE', 'MINVOLSET'),\n",
       "    ('ERRLOWOUTPUT', 'HISTORY'),\n",
       "    ('KINKEDTUBE', 'FIO2'),\n",
       "    ('HISTORY', 'LVEDVOLUME'),\n",
       "    ('HISTORY', 'ERRLOWOUTPUT'),\n",
       "    ('HISTORY', 'MINVOLSET'),\n",
       "    ('SHUNT', 'HISTORY'),\n",
       "    ('MINVOLSET', 'HISTORY'),\n",
       "    ('LVEDVOLUME', 'HISTORY'),\n",
       "    ('EXPCO2', 'ERRLOWOUTPUT'),\n",
       "    ('FIO2', 'KINKEDTUBE'),\n",
       "    ('INSUFFANESTH', 'HISTORY'),\n",
       "    ('KINKEDTUBE', 'ERRCAUTER'),\n",
       "    ('CATECHOL', 'HISTORY'),\n",
       "    ('HISTORY', 'INSUFFANESTH'),\n",
       "    ('SHUNT', 'ERRCAUTER'),\n",
       "    ('HYPOVOLEMIA', 'KINKEDTUBE'),\n",
       "    ('STROKEVOLUME', 'DISCONNECT'),\n",
       "    ('ERRLOWOUTPUT', 'FIO2'),\n",
       "    ('MINVOLSET', 'ANAPHYLAXIS'),\n",
       "    ('ERRLOWOUTPUT', 'ANAPHYLAXIS'),\n",
       "    ('FIO2', 'ANAPHYLAXIS'),\n",
       "    ('LVFAILURE', 'PULMEMBOLUS'),\n",
       "    ('ANAPHYLAXIS', 'LVFAILURE'),\n",
       "    ('MINVOLSET', 'LVFAILURE'),\n",
       "    ('ANAPHYLAXIS', 'MINVOLSET'),\n",
       "    ('HISTORY', 'FIO2'),\n",
       "    ('ERRLOWOUTPUT', 'PULMEMBOLUS'),\n",
       "    ('INTUBATION', 'PULMEMBOLUS'),\n",
       "    ('DISCONNECT', 'FIO2'),\n",
       "    ('HYPOVOLEMIA', 'PULMEMBOLUS'),\n",
       "    ('SAO2', 'LVFAILURE'),\n",
       "    ('CVP', 'FIO2'),\n",
       "    ('HYPOVOLEMIA', 'LVFAILURE'),\n",
       "    ('HISTORY', 'HYPOVOLEMIA'),\n",
       "    ('ERRCAUTER', 'HYPOVOLEMIA'),\n",
       "    ('KINKEDTUBE', 'HYPOVOLEMIA'),\n",
       "    ('DISCONNECT', 'INSUFFANESTH'),\n",
       "    ('HISTORY', 'HRBP'),\n",
       "    ('HRBP', 'HISTORY'),\n",
       "    ('ANAPHYLAXIS', 'PCWP'),\n",
       "    ('HISTORY', 'TPR'),\n",
       "    ('TPR', 'HISTORY'),\n",
       "    ('HYPOVOLEMIA', 'INSUFFANESTH'),\n",
       "    ('FIO2', 'INSUFFANESTH'),\n",
       "    ('INSUFFANESTH', 'LVFAILURE'),\n",
       "    ('FIO2', 'PCWP'),\n",
       "    ('ERRLOWOUTPUT', 'HREKG'),\n",
       "    ('INTUBATION', 'HYPOVOLEMIA'),\n",
       "    ('KINKEDTUBE', 'TPR'),\n",
       "    ('SHUNT', 'ERRLOWOUTPUT'),\n",
       "    ('ANAPHYLAXIS', 'HISTORY'),\n",
       "    ('SHUNT', 'INSUFFANESTH'),\n",
       "    ('KINKEDTUBE', 'ERRLOWOUTPUT'),\n",
       "    ('PULMEMBOLUS', 'KINKEDTUBE'),\n",
       "    ('FIO2', 'ERRCAUTER'),\n",
       "    ('ANAPHYLAXIS', 'INSUFFANESTH'),\n",
       "    ('INSUFFANESTH', 'ANAPHYLAXIS'),\n",
       "    ('ANAPHYLAXIS', 'KINKEDTUBE'),\n",
       "    ('STROKEVOLUME', 'HISTORY'),\n",
       "    ('HR', 'HISTORY')],\n",
       "   'common_parents': [('LVFAILURE', 'HYPOVOLEMIA'),\n",
       "    ('VENTTUBE', 'KINKEDTUBE'),\n",
       "    ('PULMEMBOLUS', 'INTUBATION'),\n",
       "    ('VENTMACH', 'DISCONNECT'),\n",
       "    ('INTUBATION', 'PULMEMBOLUS'),\n",
       "    ('HYPOVOLEMIA', 'LVFAILURE')],\n",
       "   'common_childs': [('LVFAILURE', 'HYPOVOLEMIA'),\n",
       "    ('VENTTUBE', 'KINKEDTUBE'),\n",
       "    ('PULMEMBOLUS', 'INTUBATION'),\n",
       "    ('VENTMACH', 'DISCONNECT'),\n",
       "    ('INTUBATION', 'PULMEMBOLUS'),\n",
       "    ('HYPOVOLEMIA', 'LVFAILURE')]}},\n",
       " 'asia': {'A': {'direct_edges': [('tuberculosis',\n",
       "     'either_turb_or_lung_cancer'),\n",
       "    ('smoking', 'bronchitis'),\n",
       "    ('lung_cancer', 'either_turb_or_lung_cancer'),\n",
       "    ('bronchitis', 'dyspnoea'),\n",
       "    ('either_turb_or_lung_cancer', 'positive_xray'),\n",
       "    ('either_turb_or_lung_cancer', 'dyspnoea'),\n",
       "    ('visit_to_asia', 'tuberculosis'),\n",
       "    ('smoking', 'lung_cancer')],\n",
       "   'reversed_edges': [],\n",
       "   'indirect_paths': [('lung_cancer', 'dyspnoea'),\n",
       "    ('smoking', 'either_turb_or_lung_cancer'),\n",
       "    ('smoking', 'dyspnoea'),\n",
       "    ('visit_to_asia', 'dyspnoea'),\n",
       "    ('smoking', 'positive_xray'),\n",
       "    ('tuberculosis', 'dyspnoea'),\n",
       "    ('tuberculosis', 'positive_xray'),\n",
       "    ('lung_cancer', 'positive_xray'),\n",
       "    ('visit_to_asia', 'positive_xray')],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [('smoking', 'tuberculosis')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'B': {'direct_edges': [],\n",
       "   'reversed_edges': [('bronchitis', 'smoking'),\n",
       "    ('either_turb_or_lung_cancer', 'tuberculosis'),\n",
       "    ('either_turb_or_lung_cancer', 'lung_cancer'),\n",
       "    ('lung_cancer', 'smoking'),\n",
       "    ('tuberculosis', 'visit_to_asia'),\n",
       "    ('dyspnoea', 'bronchitis'),\n",
       "    ('positive_xray', 'either_turb_or_lung_cancer')],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [('either_turb_or_lung_cancer', 'smoking'),\n",
       "    ('either_turb_or_lung_cancer', 'visit_to_asia'),\n",
       "    ('dyspnoea', 'smoking'),\n",
       "    ('positive_xray', 'smoking'),\n",
       "    ('dyspnoea', 'visit_to_asia')],\n",
       "   'no_connections': [('tuberculosis', 'smoking'),\n",
       "    ('bronchitis', 'positive_xray')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [('visit_to_asia', 'lung_cancer'),\n",
       "    ('lung_cancer', 'tuberculosis'),\n",
       "    ('lung_cancer', 'visit_to_asia'),\n",
       "    ('either_turb_or_lung_cancer', 'bronchitis'),\n",
       "    ('positive_xray', 'dyspnoea'),\n",
       "    ('smoking', 'visit_to_asia'),\n",
       "    ('visit_to_asia', 'bronchitis'),\n",
       "    ('bronchitis', 'tuberculosis'),\n",
       "    ('bronchitis', 'visit_to_asia'),\n",
       "    ('bronchitis', 'lung_cancer'),\n",
       "    ('tuberculosis', 'lung_cancer'),\n",
       "    ('lung_cancer', 'bronchitis')],\n",
       "   'common_parents': [('lung_cancer', 'tuberculosis'),\n",
       "    ('either_turb_or_lung_cancer', 'bronchitis'),\n",
       "    ('tuberculosis', 'lung_cancer')],\n",
       "   'common_childs': [('lung_cancer', 'tuberculosis'),\n",
       "    ('either_turb_or_lung_cancer', 'bronchitis'),\n",
       "    ('tuberculosis', 'lung_cancer')]}},\n",
       " 'insurance': {'A': {'direct_edges': [('Age', 'GoodStudent'),\n",
       "    ('Age', 'SocioEcon'),\n",
       "    ('Age', 'RiskAversion'),\n",
       "    ('SocioEcon', 'GoodStudent'),\n",
       "    ('SocioEcon', 'VehicleYear'),\n",
       "    ('SocioEcon', 'MakeModel'),\n",
       "    ('SocioEcon', 'HomeBase'),\n",
       "    ('SocioEcon', 'AntiTheft'),\n",
       "    ('SocioEcon', 'OtherCar'),\n",
       "    ('RiskAversion', 'DrivQuality'),\n",
       "    ('RiskAversion', 'AntiTheft'),\n",
       "    ('RiskAversion', 'DrivHist'),\n",
       "    ('VehicleYear', 'Antilock'),\n",
       "    ('VehicleYear', 'CarValue'),\n",
       "    ('VehicleYear', 'Airbag'),\n",
       "    ('ThisCarDam', 'ThisCarCost'),\n",
       "    ('RuggedAuto', 'ThisCarDam'),\n",
       "    ('RuggedAuto', 'Cushioning'),\n",
       "    ('Accident', 'ThisCarDam'),\n",
       "    ('Accident', 'OtherCarCost'),\n",
       "    ('Accident', 'MedCost'),\n",
       "    ('Accident', 'ILiCost'),\n",
       "    ('MakeModel', 'RuggedAuto'),\n",
       "    ('MakeModel', 'Antilock'),\n",
       "    ('MakeModel', 'CarValue'),\n",
       "    ('MakeModel', 'Airbag'),\n",
       "    ('DrivQuality', 'Accident'),\n",
       "    ('DrivingSkill', 'DrivQuality'),\n",
       "    ('DrivingSkill', 'DrivHist'),\n",
       "    ('ThisCarCost', 'PropCost'),\n",
       "    ('Theft', 'ThisCarCost'),\n",
       "    ('CarValue', 'ThisCarCost'),\n",
       "    ('HomeBase', 'Theft'),\n",
       "    ('Cushioning', 'MedCost'),\n",
       "    ('Airbag', 'Cushioning'),\n",
       "    ('Age', 'DrivingSkill'),\n",
       "    ('SeniorTrain', 'DrivingSkill'),\n",
       "    ('Age', 'SeniorTrain'),\n",
       "    ('Age', 'MedCost'),\n",
       "    ('RiskAversion', 'VehicleYear'),\n",
       "    ('RiskAversion', 'MakeModel'),\n",
       "    ('RiskAversion', 'SeniorTrain'),\n",
       "    ('RuggedAuto', 'OtherCarCost'),\n",
       "    ('Mileage', 'Accident'),\n",
       "    ('Mileage', 'CarValue'),\n",
       "    ('Antilock', 'Accident'),\n",
       "    ('CarValue', 'Theft'),\n",
       "    ('AntiTheft', 'Theft')],\n",
       "   'reversed_edges': [('DrivingSkill', 'Age'),\n",
       "    ('DrivingSkill', 'SeniorTrain'),\n",
       "    ('SeniorTrain', 'Age'),\n",
       "    ('SeniorTrain', 'RiskAversion'),\n",
       "    ('CarValue', 'Mileage'),\n",
       "    ('ThisCarCost', 'CarValue')],\n",
       "   'indirect_paths': [('VehicleYear', 'Theft'),\n",
       "    ('RuggedAuto', 'MedCost'),\n",
       "    ('Accident', 'ThisCarCost'),\n",
       "    ('SocioEcon', 'SeniorTrain'),\n",
       "    ('DrivQuality', 'ThisCarDam'),\n",
       "    ('DrivQuality', 'MedCost'),\n",
       "    ('SocioEcon', 'Airbag'),\n",
       "    ('RiskAversion', 'DrivingSkill'),\n",
       "    ('SeniorTrain', 'DrivQuality'),\n",
       "    ('VehicleYear', 'ThisCarCost'),\n",
       "    ('ThisCarDam', 'PropCost'),\n",
       "    ('RuggedAuto', 'ThisCarCost'),\n",
       "    ('VehicleYear', 'ILiCost'),\n",
       "    ('DrivingSkill', 'MedCost'),\n",
       "    ('Age', 'DrivQuality'),\n",
       "    ('DrivQuality', 'ILiCost'),\n",
       "    ('SeniorTrain', 'ThisCarDam'),\n",
       "    ('Accident', 'PropCost'),\n",
       "    ('DrivQuality', 'OtherCarCost'),\n",
       "    ('VehicleYear', 'Cushioning'),\n",
       "    ('MakeModel', 'Cushioning'),\n",
       "    ('SocioEcon', 'RuggedAuto'),\n",
       "    ('Antilock', 'ThisCarDam'),\n",
       "    ('SeniorTrain', 'DrivHist'),\n",
       "    ('SocioEcon', 'MedCost'),\n",
       "    ('VehicleYear', 'ThisCarDam'),\n",
       "    ('VehicleYear', 'Accident'),\n",
       "    ('MakeModel', 'PropCost'),\n",
       "    ('MakeModel', 'OtherCarCost'),\n",
       "    ('Mileage', 'PropCost'),\n",
       "    ('Antilock', 'MedCost'),\n",
       "    ('DrivingSkill', 'ThisCarCost'),\n",
       "    ('SeniorTrain', 'Accident'),\n",
       "    ('SeniorTrain', 'ILiCost'),\n",
       "    ('Theft', 'PropCost'),\n",
       "    ('CarValue', 'PropCost'),\n",
       "    ('HomeBase', 'ThisCarCost'),\n",
       "    ('Airbag', 'MedCost')],\n",
       "   'reversed_indirect_paths': [('SeniorTrain', 'SocioEcon'),\n",
       "    ('MedCost', 'RuggedAuto'),\n",
       "    ('DrivingSkill', 'RiskAversion'),\n",
       "    ('ThisCarCost', 'VehicleYear'),\n",
       "    ('ThisCarCost', 'RuggedAuto'),\n",
       "    ('ILiCost', 'VehicleYear'),\n",
       "    ('MedCost', 'DrivingSkill')],\n",
       "   'no_connections': [('VehicleYear', 'Mileage'),\n",
       "    ('ThisCarDam', 'MedCost'),\n",
       "    ('MakeModel', 'Mileage'),\n",
       "    ('RuggedAuto', 'Accident'),\n",
       "    ('Theft', 'ThisCarDam'),\n",
       "    ('ILiCost', 'ThisCarDam'),\n",
       "    ('ILiCost', 'ThisCarCost'),\n",
       "    ('Accident', 'RuggedAuto'),\n",
       "    ('ThisCarCost', 'ILiCost'),\n",
       "    ('ThisCarDam', 'ILiCost'),\n",
       "    ('MedCost', 'OtherCarCost'),\n",
       "    ('ThisCarCost', 'Cushioning'),\n",
       "    ('Cushioning', 'ThisCarCost'),\n",
       "    ('OtherCarCost', 'ILiCost'),\n",
       "    ('CarValue', 'Antilock'),\n",
       "    ('ThisCarDam', 'MedCost'),\n",
       "    ('Theft', 'Cushioning'),\n",
       "    ('HomeBase', 'MedCost')],\n",
       "   'common_parents': [('VehicleYear', 'Mileage'),\n",
       "    ('MakeModel', 'Mileage'),\n",
       "    ('RuggedAuto', 'Accident'),\n",
       "    ('Theft', 'ThisCarDam'),\n",
       "    ('Accident', 'RuggedAuto')],\n",
       "   'common_childs': [('VehicleYear', 'Mileage'),\n",
       "    ('MakeModel', 'Mileage'),\n",
       "    ('RuggedAuto', 'Accident'),\n",
       "    ('Theft', 'ThisCarDam'),\n",
       "    ('Accident', 'RuggedAuto')]},\n",
       "  'B': {'direct_edges': [('SocioEcon', 'RiskAversion')],\n",
       "   'reversed_edges': [('VehicleYear', 'SocioEcon'),\n",
       "    ('MakeModel', 'SocioEcon'),\n",
       "    ('CarValue', 'VehicleYear'),\n",
       "    ('CarValue', 'MakeModel'),\n",
       "    ('SocioEcon', 'Age'),\n",
       "    ('GoodStudent', 'SocioEcon'),\n",
       "    ('RiskAversion', 'Age'),\n",
       "    ('ThisCarCost', 'Theft'),\n",
       "    ('ThisCarDam', 'Accident'),\n",
       "    ('Accident', 'DrivQuality'),\n",
       "    ('GoodStudent', 'Age'),\n",
       "    ('DrivQuality', 'RiskAversion'),\n",
       "    ('DrivQuality', 'DrivingSkill'),\n",
       "    ('ThisCarCost', 'ThisCarDam'),\n",
       "    ('ILiCost', 'Accident'),\n",
       "    ('ThisCarDam', 'RuggedAuto'),\n",
       "    ('RuggedAuto', 'MakeModel'),\n",
       "    ('OtherCar', 'SocioEcon'),\n",
       "    ('MedCost', 'Accident'),\n",
       "    ('MedCost', 'Cushioning'),\n",
       "    ('Cushioning', 'Airbag'),\n",
       "    ('Airbag', 'VehicleYear'),\n",
       "    ('Airbag', 'MakeModel'),\n",
       "    ('MedCost', 'Age')],\n",
       "   'indirect_paths': [('MakeModel', 'Theft')],\n",
       "   'reversed_indirect_paths': [('ThisCarCost', 'SocioEcon'),\n",
       "    ('PropCost', 'ThisCarDam'),\n",
       "    ('Airbag', 'SocioEcon'),\n",
       "    ('Accident', 'DrivingSkill')],\n",
       "   'no_connections': [('MedCost', 'ThisCarDam'),\n",
       "    ('GoodStudent', 'Mileage'),\n",
       "    ('Age', 'Mileage'),\n",
       "    ('ThisCarDam', 'CarValue'),\n",
       "    ('RuggedAuto', 'DrivingSkill'),\n",
       "    ('DrivQuality', 'CarValue'),\n",
       "    ('Mileage', 'DrivingSkill'),\n",
       "    ('CarValue', 'HomeBase'),\n",
       "    ('CarValue', 'MedCost'),\n",
       "    ('AntiTheft', 'OtherCarCost'),\n",
       "    ('OtherCarCost', 'Airbag')],\n",
       "   'common_parents': [('ThisCarDam', 'CarValue'), ('CarValue', 'HomeBase')],\n",
       "   'common_childs': [('ThisCarDam', 'CarValue'), ('CarValue', 'HomeBase')]},\n",
       "  'C': {'direct_edges': [('VehicleYear', 'RuggedAuto')],\n",
       "   'reversed_edges': [('RuggedAuto', 'VehicleYear'),\n",
       "    ('Cushioning', 'RuggedAuto')],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [('OtherCarCost', 'Mileage'),\n",
       "    ('Theft', 'VehicleYear'),\n",
       "    ('Theft', 'Age'),\n",
       "    ('AntiTheft', 'Age')],\n",
       "   'no_connections': [('Airbag', 'Mileage'),\n",
       "    ('MakeModel', 'VehicleYear'),\n",
       "    ('Airbag', 'RuggedAuto'),\n",
       "    ('Theft', 'GoodStudent'),\n",
       "    ('OtherCarCost', 'Theft'),\n",
       "    ('ThisCarDam', 'Theft'),\n",
       "    ('DrivingSkill', 'Theft'),\n",
       "    ('DrivQuality', 'Theft'),\n",
       "    ('Antilock', 'RuggedAuto'),\n",
       "    ('RuggedAuto', 'Airbag'),\n",
       "    ('VehicleYear', 'MakeModel'),\n",
       "    ('Airbag', 'GoodStudent'),\n",
       "    ('VehicleYear', 'GoodStudent'),\n",
       "    ('Antilock', 'GoodStudent'),\n",
       "    ('SeniorTrain', 'GoodStudent'),\n",
       "    ('ThisCarCost', 'MedCost'),\n",
       "    ('OtherCar', 'GoodStudent'),\n",
       "    ('Antilock', 'Theft'),\n",
       "    ('Theft', 'DrivingSkill'),\n",
       "    ('OtherCar', 'Theft'),\n",
       "    ('ILiCost', 'OtherCarCost'),\n",
       "    ('HomeBase', 'OtherCar'),\n",
       "    ('ILiCost', 'MedCost'),\n",
       "    ('VehicleYear', 'OtherCar'),\n",
       "    ('ILiCost', 'OtherCar'),\n",
       "    ('Accident', 'Theft'),\n",
       "    ('CarValue', 'Airbag'),\n",
       "    ('Antilock', 'Airbag'),\n",
       "    ('DrivQuality', 'AntiTheft'),\n",
       "    ('VehicleYear', 'SeniorTrain'),\n",
       "    ('Airbag', 'SeniorTrain'),\n",
       "    ('Airbag', 'Theft'),\n",
       "    ('SeniorTrain', 'AntiTheft')],\n",
       "   'common_parents': [('MakeModel', 'VehicleYear'),\n",
       "    ('Airbag', 'RuggedAuto'),\n",
       "    ('ThisCarDam', 'Theft'),\n",
       "    ('RuggedAuto', 'Airbag'),\n",
       "    ('VehicleYear', 'MakeModel')],\n",
       "   'common_childs': [('MakeModel', 'VehicleYear'),\n",
       "    ('Airbag', 'RuggedAuto'),\n",
       "    ('ThisCarDam', 'Theft'),\n",
       "    ('RuggedAuto', 'Airbag'),\n",
       "    ('VehicleYear', 'MakeModel')]}},\n",
       " 'mildew': {'A': {'direct_edges': [('dm_1', 'dm_2'),\n",
       "    ('foto_1', 'dm_1'),\n",
       "    ('straaling_1', 'foto_1'),\n",
       "    ('lai_1', 'foto_1'),\n",
       "    ('lai_1', 'lai_2'),\n",
       "    ('meldug_1', 'lai_1'),\n",
       "    ('meldug_1', 'meldug_2'),\n",
       "    ('lai_0', 'lai_1'),\n",
       "    ('foto_2', 'dm_2'),\n",
       "    ('straaling_2', 'foto_2'),\n",
       "    ('lai_2', 'foto_2'),\n",
       "    ('lai_2', 'lai_3'),\n",
       "    ('meldug_2', 'lai_2'),\n",
       "    ('meldug_2', 'meldug_3'),\n",
       "    ('straaling_3', 'foto_3'),\n",
       "    ('lai_3', 'foto_3'),\n",
       "    ('lai_3', 'lai_4'),\n",
       "    ('meldug_3', 'lai_3'),\n",
       "    ('meldug_3', 'meldug_4'),\n",
       "    ('straaling_4', 'foto_4'),\n",
       "    ('lai_4', 'foto_4'),\n",
       "    ('middel_1', 'meldug_2'),\n",
       "    ('middel_2', 'meldug_3'),\n",
       "    ('middel_3', 'meldug_4'),\n",
       "    ('dm_4', 'udbytte'),\n",
       "    ('dm_2', 'dm_3'),\n",
       "    ('temp_2', 'mikro_2'),\n",
       "    ('foto_3', 'dm_3'),\n",
       "    ('temp_3', 'mikro_3'),\n",
       "    ('meldug_4', 'lai_4'),\n",
       "    ('mikro_1', 'meldug_2'),\n",
       "    ('mikro_2', 'meldug_3'),\n",
       "    ('temp_1', 'foto_1'),\n",
       "    ('lai_1', 'mikro_1'),\n",
       "    ('temp_2', 'foto_2'),\n",
       "    ('lai_2', 'mikro_2'),\n",
       "    ('mikro_3', 'meldug_4'),\n",
       "    ('nedboer_2', 'mikro_2'),\n",
       "    ('nedboer_3', 'mikro_3'),\n",
       "    ('temp_3', 'foto_3'),\n",
       "    ('nedboer_1', 'mikro_1'),\n",
       "    ('temp_4', 'foto_4'),\n",
       "    ('dm_3', 'dm_4'),\n",
       "    ('foto_4', 'dm_4'),\n",
       "    ('temp_1', 'mikro_1')],\n",
       "   'reversed_edges': [('meldug_2', 'mikro_1'),\n",
       "    ('mikro_1', 'temp_1'),\n",
       "    ('mikro_2', 'temp_2'),\n",
       "    ('mikro_3', 'temp_3')],\n",
       "   'indirect_paths': [('lai_3', 'dm_3'),\n",
       "    ('mikro_3', 'lai_4'),\n",
       "    ('lai_1', 'dm_1'),\n",
       "    ('lai_4', 'dm_4'),\n",
       "    ('straaling_1', 'dm_1'),\n",
       "    ('meldug_3', 'foto_3'),\n",
       "    ('meldug_4', 'foto_4'),\n",
       "    ('meldug_3', 'dm_3'),\n",
       "    ('lai_2', 'dm_2'),\n",
       "    ('middel_1', 'lai_2'),\n",
       "    ('foto_2', 'dm_4'),\n",
       "    ('lai_1', 'dm_4'),\n",
       "    ('meldug_3', 'dm_4'),\n",
       "    ('meldug_3', 'udbytte'),\n",
       "    ('dm_2', 'dm_4'),\n",
       "    ('lai_3', 'foto_4'),\n",
       "    ('temp_1', 'dm_1'),\n",
       "    ('meldug_2', 'foto_2'),\n",
       "    ('dm_1', 'dm_3'),\n",
       "    ('straaling_1', 'dm_3'),\n",
       "    ('temp_1', 'lai_3'),\n",
       "    ('lai_1', 'dm_2'),\n",
       "    ('meldug_1', 'foto_1'),\n",
       "    ('meldug_1', 'meldug_4'),\n",
       "    ('lai_0', 'dm_1'),\n",
       "    ('temp_2', 'dm_2'),\n",
       "    ('temp_2', 'meldug_4'),\n",
       "    ('lai_2', 'dm_4'),\n",
       "    ('temp_3', 'udbytte'),\n",
       "    ('meldug_4', 'udbytte'),\n",
       "    ('middel_1', 'mikro_2'),\n",
       "    ('middel_1', 'udbytte'),\n",
       "    ('nedboer_1', 'foto_2'),\n",
       "    ('nedboer_1', 'meldug_3'),\n",
       "    ('nedboer_2', 'udbytte'),\n",
       "    ('nedboer_3', 'meldug_4')],\n",
       "   'reversed_indirect_paths': [('lai_2', 'middel_1'),\n",
       "    ('foto_2', 'middel_1'),\n",
       "    ('mikro_1', 'lai_0')],\n",
       "   'no_connections': [('straaling_3', 'lai_3'),\n",
       "    ('straaling_4', 'lai_4'),\n",
       "    ('temp_4', 'lai_4'),\n",
       "    ('straaling_1', 'temp_1'),\n",
       "    ('meldug_4', 'dm_3'),\n",
       "    ('nedboer_1', 'lai_1'),\n",
       "    ('foto_1', 'foto_3'),\n",
       "    ('dm_2', 'foto_3'),\n",
       "    ('straaling_1', 'temp_3'),\n",
       "    ('straaling_1', 'mikro_2'),\n",
       "    ('temp_3', 'temp_4')],\n",
       "   'common_parents': [('straaling_3', 'lai_3'),\n",
       "    ('straaling_4', 'lai_4'),\n",
       "    ('temp_4', 'lai_4'),\n",
       "    ('straaling_1', 'temp_1'),\n",
       "    ('nedboer_1', 'lai_1'),\n",
       "    ('dm_2', 'foto_3')],\n",
       "   'common_childs': [('straaling_3', 'lai_3'),\n",
       "    ('straaling_4', 'lai_4'),\n",
       "    ('temp_4', 'lai_4'),\n",
       "    ('straaling_1', 'temp_1'),\n",
       "    ('nedboer_1', 'lai_1'),\n",
       "    ('dm_2', 'foto_3')]},\n",
       "  'B': {'direct_edges': [('lai_3', 'mikro_3')],\n",
       "   'reversed_edges': [('mikro_1', 'nedboer_1'),\n",
       "    ('mikro_2', 'nedboer_2'),\n",
       "    ('mikro_3', 'nedboer_3'),\n",
       "    ('foto_1', 'temp_1'),\n",
       "    ('lai_1', 'lai_0'),\n",
       "    ('foto_2', 'temp_2'),\n",
       "    ('foto_3', 'temp_3'),\n",
       "    ('foto_4', 'temp_4'),\n",
       "    ('meldug_4', 'mikro_3'),\n",
       "    ('meldug_4', 'middel_3'),\n",
       "    ('foto_3', 'straaling_3'),\n",
       "    ('meldug_3', 'middel_2'),\n",
       "    ('meldug_2', 'middel_1'),\n",
       "    ('lai_4', 'lai_3'),\n",
       "    ('meldug_3', 'mikro_2'),\n",
       "    ('foto_4', 'straaling_4'),\n",
       "    ('meldug_2', 'meldug_1'),\n",
       "    ('foto_1', 'straaling_1'),\n",
       "    ('lai_2', 'lai_1'),\n",
       "    ('lai_3', 'lai_2'),\n",
       "    ('meldug_3', 'meldug_2'),\n",
       "    ('meldug_4', 'meldug_3'),\n",
       "    ('dm_1', 'foto_1'),\n",
       "    ('foto_2', 'straaling_2'),\n",
       "    ('lai_2', 'meldug_2'),\n",
       "    ('dm_2', 'dm_1'),\n",
       "    ('foto_1', 'lai_1'),\n",
       "    ('foto_3', 'lai_3'),\n",
       "    ('dm_2', 'foto_2'),\n",
       "    ('dm_3', 'dm_2'),\n",
       "    ('foto_4', 'lai_4'),\n",
       "    ('dm_3', 'foto_3'),\n",
       "    ('lai_3', 'meldug_3'),\n",
       "    ('udbytte', 'dm_4')],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [('lai_4', 'mikro_3'),\n",
       "    ('lai_3', 'middel_2'),\n",
       "    ('dm_3', 'straaling_3'),\n",
       "    ('dm_3', 'lai_3'),\n",
       "    ('lai_2', 'mikro_1'),\n",
       "    ('lai_3', 'mikro_2'),\n",
       "    ('dm_2', 'straaling_2'),\n",
       "    ('dm_2', 'lai_2'),\n",
       "    ('foto_3', 'meldug_2'),\n",
       "    ('foto_3', 'middel_1')],\n",
       "   'no_connections': [('lai_4', 'temp_4'),\n",
       "    ('lai_3', 'straaling_3'),\n",
       "    ('lai_4', 'straaling_4'),\n",
       "    ('lai_1', 'straaling_1'),\n",
       "    ('lai_1', 'temp_1'),\n",
       "    ('lai_2', 'temp_2'),\n",
       "    ('lai_3', 'temp_3'),\n",
       "    ('lai_4', 'straaling_2'),\n",
       "    ('lai_2', 'foto_1'),\n",
       "    ('dm_1', 'straaling_4'),\n",
       "    ('dm_1', 'lai_4'),\n",
       "    ('dm_1', 'mikro_2'),\n",
       "    ('dm_1', 'nedboer_1'),\n",
       "    ('foto_1', 'mikro_3'),\n",
       "    ('straaling_1', 'middel_3'),\n",
       "    ('temp_1', 'nedboer_2'),\n",
       "    ('dm_2', 'straaling_3'),\n",
       "    ('dm_2', 'nedboer_2'),\n",
       "    ('straaling_2', 'mikro_2'),\n",
       "    ('meldug_2', 'nedboer_2'),\n",
       "    ('meldug_2', 'nedboer_3'),\n",
       "    ('temp_4', 'nedboer_2'),\n",
       "    ('mikro_2', 'nedboer_3'),\n",
       "    ('middel_2', 'nedboer_3')],\n",
       "   'common_parents': [('lai_4', 'temp_4'),\n",
       "    ('lai_3', 'straaling_3'),\n",
       "    ('lai_4', 'straaling_4'),\n",
       "    ('lai_1', 'straaling_1'),\n",
       "    ('lai_1', 'temp_1'),\n",
       "    ('lai_2', 'temp_2'),\n",
       "    ('lai_3', 'temp_3')],\n",
       "   'common_childs': [('lai_4', 'temp_4'),\n",
       "    ('lai_3', 'straaling_3'),\n",
       "    ('lai_4', 'straaling_4'),\n",
       "    ('lai_1', 'straaling_1'),\n",
       "    ('lai_1', 'temp_1'),\n",
       "    ('lai_2', 'temp_2'),\n",
       "    ('lai_3', 'temp_3')]},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [('mikro_1', 'lai_1')],\n",
       "   'indirect_paths': [('lai_3', 'udbytte'),\n",
       "    ('lai_3', 'dm_4'),\n",
       "    ('dm_3', 'udbytte'),\n",
       "    ('foto_4', 'udbytte'),\n",
       "    ('nedboer_2', 'lai_4'),\n",
       "    ('nedboer_3', 'lai_4'),\n",
       "    ('meldug_2', 'mikro_2'),\n",
       "    ('meldug_1', 'mikro_1'),\n",
       "    ('nedboer_1', 'lai_4'),\n",
       "    ('foto_1', 'dm_2'),\n",
       "    ('lai_1', 'meldug_2'),\n",
       "    ('meldug_3', 'mikro_3'),\n",
       "    ('lai_2', 'lai_4'),\n",
       "    ('lai_2', 'dm_4'),\n",
       "    ('foto_2', 'udbytte'),\n",
       "    ('lai_4', 'udbytte'),\n",
       "    ('foto_2', 'dm_3'),\n",
       "    ('meldug_3', 'lai_4'),\n",
       "    ('straaling_1', 'dm_2'),\n",
       "    ('foto_1', 'udbytte'),\n",
       "    ('dm_2', 'udbytte'),\n",
       "    ('foto_3', 'dm_4'),\n",
       "    ('lai_2', 'meldug_3'),\n",
       "    ('meldug_1', 'lai_2'),\n",
       "    ('meldug_2', 'lai_3'),\n",
       "    ('straaling_2', 'udbytte'),\n",
       "    ('meldug_2', 'udbytte'),\n",
       "    ('lai_3', 'meldug_4'),\n",
       "    ('meldug_3', 'foto_4'),\n",
       "    ('meldug_4', 'udbytte'),\n",
       "    ('foto_1', 'dm_3'),\n",
       "    ('lai_1', 'lai_3'),\n",
       "    ('lai_1', 'lai_4'),\n",
       "    ('foto_1', 'dm_4'),\n",
       "    ('meldug_2', 'meldug_4'),\n",
       "    ('lai_2', 'udbytte'),\n",
       "    ('foto_3', 'udbytte'),\n",
       "    ('lai_1', 'udbytte'),\n",
       "    ('middel_2', 'lai_3'),\n",
       "    ('lai_2', 'meldug_4'),\n",
       "    ('meldug_1', 'lai_3'),\n",
       "    ('meldug_2', 'lai_4')],\n",
       "   'reversed_indirect_paths': [('lai_4', 'nedboer_3'),\n",
       "    ('lai_4', 'lai_1'),\n",
       "    ('lai_4', 'lai_0'),\n",
       "    ('lai_4', 'mikro_1'),\n",
       "    ('mikro_2', 'meldug_2'),\n",
       "    ('mikro_1', 'meldug_1'),\n",
       "    ('lai_2', 'meldug_1'),\n",
       "    ('lai_3', 'middel_1'),\n",
       "    ('dm_3', 'straaling_2'),\n",
       "    ('dm_3', 'lai_2'),\n",
       "    ('udbytte', 'foto_4'),\n",
       "    ('udbytte', 'dm_3'),\n",
       "    ('dm_3', 'dm_1'),\n",
       "    ('dm_2', 'lai_1'),\n",
       "    ('dm_2', 'foto_1'),\n",
       "    ('meldug_2', 'lai_1'),\n",
       "    ('dm_3', 'foto_2'),\n",
       "    ('udbytte', 'lai_4'),\n",
       "    ('dm_2', 'straaling_1'),\n",
       "    ('dm_3', 'foto_1'),\n",
       "    ('meldug_3', 'lai_2'),\n",
       "    ('meldug_4', 'lai_3'),\n",
       "    ('lai_4', 'meldug_3'),\n",
       "    ('lai_2', 'lai_0'),\n",
       "    ('lai_3', 'meldug_1'),\n",
       "    ('udbytte', 'lai_3'),\n",
       "    ('lai_3', 'meldug_2'),\n",
       "    ('lai_4', 'middel_1'),\n",
       "    ('meldug_4', 'middel_1'),\n",
       "    ('meldug_3', 'lai_1'),\n",
       "    ('udbytte', 'lai_2'),\n",
       "    ('foto_2', 'lai_1'),\n",
       "    ('dm_3', 'straaling_1'),\n",
       "    ('meldug_4', 'meldug_2'),\n",
       "    ('lai_4', 'middel_2'),\n",
       "    ('meldug_4', 'middel_2'),\n",
       "    ('dm_3', 'lai_1'),\n",
       "    ('lai_3', 'lai_1'),\n",
       "    ('lai_4', 'mikro_2'),\n",
       "    ('lai_4', 'lai_2'),\n",
       "    ('lai_4', 'meldug_2'),\n",
       "    ('meldug_2', 'lai_0'),\n",
       "    ('lai_4', 'meldug_1'),\n",
       "    ('lai_4', 'nedboer_1'),\n",
       "    ('lai_4', 'nedboer_2'),\n",
       "    ('meldug_3', 'middel_1'),\n",
       "    ('meldug_3', 'meldug_1'),\n",
       "    ('lai_4', 'temp_2')],\n",
       "   'no_connections': [('meldug_1', 'lai_0'),\n",
       "    ('lai_0', 'meldug_1'),\n",
       "    ('meldug_3', 'middel_3'),\n",
       "    ('meldug_2', 'middel_2'),\n",
       "    ('middel_3', 'meldug_3'),\n",
       "    ('meldug_1', 'middel_1'),\n",
       "    ('mikro_1', 'middel_1'),\n",
       "    ('middel_2', 'meldug_2'),\n",
       "    ('middel_1', 'meldug_1'),\n",
       "    ('straaling_2', 'temp_2'),\n",
       "    ('lai_2', 'straaling_2'),\n",
       "    ('middel_1', 'mikro_1'),\n",
       "    ('lai_2', 'middel_2'),\n",
       "    ('middel_1', 'lai_1'),\n",
       "    ('straaling_3', 'temp_3'),\n",
       "    ('lai_3', 'straaling_2'),\n",
       "    ('straaling_4', 'temp_4'),\n",
       "    ('temp_1', 'straaling_1'),\n",
       "    ('foto_2', 'dm_1'),\n",
       "    ('middel_3', 'mikro_3'),\n",
       "    ('lai_1', 'middel_1'),\n",
       "    ('meldug_3', 'foto_2'),\n",
       "    ('dm_1', 'foto_2'),\n",
       "    ('middel_3', 'middel_2'),\n",
       "    ('middel_2', 'mikro_2'),\n",
       "    ('foto_2', 'straaling_1'),\n",
       "    ('foto_2', 'lai_3'),\n",
       "    ('temp_3', 'nedboer_3'),\n",
       "    ('temp_2', 'straaling_2'),\n",
       "    ('meldug_4', 'foto_3'),\n",
       "    ('temp_3', 'straaling_3'),\n",
       "    ('meldug_2', 'middel_3'),\n",
       "    ('foto_2', 'foto_1'),\n",
       "    ('lai_2', 'straaling_1'),\n",
       "    ('foto_1', 'middel_1'),\n",
       "    ('lai_3', 'straaling_1'),\n",
       "    ('meldug_4', 'foto_2'),\n",
       "    ('foto_1', 'foto_2'),\n",
       "    ('foto_2', 'foto_3'),\n",
       "    ('foto_3', 'foto_4'),\n",
       "    ('foto_3', 'foto_2'),\n",
       "    ('foto_4', 'foto_3')],\n",
       "   'common_parents': [('meldug_1', 'lai_0'),\n",
       "    ('lai_0', 'meldug_1'),\n",
       "    ('meldug_3', 'middel_3'),\n",
       "    ('meldug_2', 'middel_2'),\n",
       "    ('middel_3', 'meldug_3'),\n",
       "    ('meldug_1', 'middel_1'),\n",
       "    ('mikro_1', 'middel_1'),\n",
       "    ('middel_2', 'meldug_2'),\n",
       "    ('middel_1', 'meldug_1'),\n",
       "    ('straaling_2', 'temp_2'),\n",
       "    ('lai_2', 'straaling_2'),\n",
       "    ('middel_1', 'mikro_1'),\n",
       "    ('straaling_3', 'temp_3'),\n",
       "    ('straaling_4', 'temp_4'),\n",
       "    ('temp_1', 'straaling_1'),\n",
       "    ('foto_2', 'dm_1'),\n",
       "    ('middel_3', 'mikro_3'),\n",
       "    ('dm_1', 'foto_2'),\n",
       "    ('middel_2', 'mikro_2'),\n",
       "    ('temp_3', 'nedboer_3'),\n",
       "    ('temp_2', 'straaling_2'),\n",
       "    ('temp_3', 'straaling_3')],\n",
       "   'common_childs': [('meldug_1', 'lai_0'),\n",
       "    ('lai_0', 'meldug_1'),\n",
       "    ('meldug_3', 'middel_3'),\n",
       "    ('meldug_2', 'middel_2'),\n",
       "    ('middel_3', 'meldug_3'),\n",
       "    ('meldug_1', 'middel_1'),\n",
       "    ('mikro_1', 'middel_1'),\n",
       "    ('middel_2', 'meldug_2'),\n",
       "    ('middel_1', 'meldug_1'),\n",
       "    ('straaling_2', 'temp_2'),\n",
       "    ('lai_2', 'straaling_2'),\n",
       "    ('middel_1', 'mikro_1'),\n",
       "    ('straaling_3', 'temp_3'),\n",
       "    ('straaling_4', 'temp_4'),\n",
       "    ('temp_1', 'straaling_1'),\n",
       "    ('foto_2', 'dm_1'),\n",
       "    ('middel_3', 'mikro_3'),\n",
       "    ('dm_1', 'foto_2'),\n",
       "    ('middel_2', 'mikro_2'),\n",
       "    ('temp_3', 'nedboer_3'),\n",
       "    ('temp_2', 'straaling_2'),\n",
       "    ('temp_3', 'straaling_3')]}},\n",
       " 'child': {'A': {'direct_edges': [('HypDistrib', 'LowerBodyO2'),\n",
       "    ('HypoxiaInO2', 'LowerBodyO2'),\n",
       "    ('CO2', 'CO2Report'),\n",
       "    ('ChestXray', 'XrayReport'),\n",
       "    ('Grunting', 'GruntingReport'),\n",
       "    ('Disease', 'Age'),\n",
       "    ('Disease', 'LVH'),\n",
       "    ('Disease', 'DuctFlow'),\n",
       "    ('Disease', 'LungParench'),\n",
       "    ('Disease', 'LungFlow'),\n",
       "    ('Disease', 'Sick'),\n",
       "    ('LVH', 'LVHreport'),\n",
       "    ('DuctFlow', 'HypDistrib'),\n",
       "    ('CardiacMixing', 'HypDistrib'),\n",
       "    ('LungParench', 'CO2'),\n",
       "    ('LungParench', 'ChestXray'),\n",
       "    ('LungParench', 'Grunting'),\n",
       "    ('LungFlow', 'ChestXray'),\n",
       "    ('Sick', 'Grunting'),\n",
       "    ('Sick', 'Age'),\n",
       "    ('HypoxiaInO2', 'RUQO2'),\n",
       "    ('Disease', 'CardiacMixing'),\n",
       "    ('CardiacMixing', 'HypoxiaInO2'),\n",
       "    ('LungParench', 'HypoxiaInO2'),\n",
       "    ('BirthAsphyxia', 'Disease')],\n",
       "   'reversed_edges': [('LowerBodyO2', 'HypoxiaInO2')],\n",
       "   'indirect_paths': [('Disease', 'LVHreport'),\n",
       "    ('BirthAsphyxia', 'GruntingReport'),\n",
       "    ('BirthAsphyxia', 'LVHreport'),\n",
       "    ('BirthAsphyxia', 'LVH'),\n",
       "    ('BirthAsphyxia', 'RUQO2'),\n",
       "    ('BirthAsphyxia', 'HypoxiaInO2'),\n",
       "    ('LungParench', 'CO2Report'),\n",
       "    ('Disease', 'ChestXray'),\n",
       "    ('LungFlow', 'XrayReport'),\n",
       "    ('BirthAsphyxia', 'CO2Report'),\n",
       "    ('BirthAsphyxia', 'XrayReport'),\n",
       "    ('BirthAsphyxia', 'Age'),\n",
       "    ('BirthAsphyxia', 'LungParench'),\n",
       "    ('Disease', 'GruntingReport')],\n",
       "   'reversed_indirect_paths': [('HypDistrib', 'BirthAsphyxia'),\n",
       "    ('CardiacMixing', 'BirthAsphyxia')],\n",
       "   'no_connections': [('LungFlow', 'LungParench'),\n",
       "    ('LungFlow', 'LVH'),\n",
       "    ('LVH', 'HypDistrib'),\n",
       "    ('LVH', 'DuctFlow'),\n",
       "    ('LVH', 'CardiacMixing'),\n",
       "    ('Grunting', 'XrayReport'),\n",
       "    ('LungParench', 'Sick'),\n",
       "    ('HypoxiaInO2', 'GruntingReport'),\n",
       "    ('HypoxiaInO2', 'Sick'),\n",
       "    ('LowerBodyO2', 'CO2Report'),\n",
       "    ('XrayReport', 'LVH'),\n",
       "    ('LungFlow', 'Sick')],\n",
       "   'common_parents': [('LungFlow', 'LungParench'), ('LungParench', 'Sick')],\n",
       "   'common_childs': [('LungFlow', 'LungParench'), ('LungParench', 'Sick')]},\n",
       "  'B': {'direct_edges': [],\n",
       "   'reversed_edges': [('HypoxiaInO2', 'CardiacMixing'),\n",
       "    ('Disease', 'BirthAsphyxia'),\n",
       "    ('CardiacMixing', 'Disease'),\n",
       "    ('LungParench', 'Disease'),\n",
       "    ('DuctFlow', 'Disease'),\n",
       "    ('CO2', 'LungParench'),\n",
       "    ('CO2Report', 'CO2'),\n",
       "    ('Grunting', 'Sick'),\n",
       "    ('LVH', 'Disease'),\n",
       "    ('LungFlow', 'Disease'),\n",
       "    ('Grunting', 'LungParench'),\n",
       "    ('GruntingReport', 'Grunting'),\n",
       "    ('LVHreport', 'LVH'),\n",
       "    ('HypDistrib', 'DuctFlow'),\n",
       "    ('XrayReport', 'ChestXray')],\n",
       "   'indirect_paths': [('BirthAsphyxia', 'LungFlow'),\n",
       "    ('Disease', 'HypDistrib'),\n",
       "    ('Disease', 'Grunting'),\n",
       "    ('Disease', 'LowerBodyO2'),\n",
       "    ('Disease', 'XrayReport'),\n",
       "    ('LungParench', 'RUQO2'),\n",
       "    ('LungParench', 'XrayReport'),\n",
       "    ('Sick', 'GruntingReport')],\n",
       "   'reversed_indirect_paths': [('LVHreport', 'Disease'),\n",
       "    ('GruntingReport', 'BirthAsphyxia'),\n",
       "    ('LVH', 'BirthAsphyxia'),\n",
       "    ('Grunting', 'BirthAsphyxia')],\n",
       "   'no_connections': [('LVH', 'HypoxiaInO2'),\n",
       "    ('CO2', 'LungFlow'),\n",
       "    ('ChestXray', 'DuctFlow'),\n",
       "    ('LVHreport', 'LowerBodyO2'),\n",
       "    ('RUQO2', 'LungFlow'),\n",
       "    ('CO2Report', 'CardiacMixing')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [('Age', 'Sick'), ('Age', 'Disease')],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [('DuctFlow', 'BirthAsphyxia'),\n",
       "    ('LVHreport', 'BirthAsphyxia')],\n",
       "   'no_connections': [('HypDistrib', 'LVHreport'),\n",
       "    ('Sick', 'LVHreport'),\n",
       "    ('ChestXray', 'LVHreport'),\n",
       "    ('Grunting', 'ChestXray'),\n",
       "    ('ChestXray', 'CO2'),\n",
       "    ('ChestXray', 'Grunting'),\n",
       "    ('XrayReport', 'LVHreport'),\n",
       "    ('LVHreport', 'XrayReport'),\n",
       "    ('CO2Report', 'Grunting'),\n",
       "    ('CO2Report', 'ChestXray'),\n",
       "    ('LVH', 'GruntingReport'),\n",
       "    ('LVHreport', 'ChestXray'),\n",
       "    ('CO2Report', 'GruntingReport'),\n",
       "    ('HypDistrib', 'Grunting'),\n",
       "    ('LVHreport', 'CO2Report')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []}},\n",
       " 'cancer': {'A': {'direct_edges': [('Pollution', 'Cancer'),\n",
       "    ('Smoker', 'Cancer'),\n",
       "    ('Cancer', 'Xray'),\n",
       "    ('Cancer', 'Dyspnoea')],\n",
       "   'reversed_edges': [('Xray', 'Cancer')],\n",
       "   'indirect_paths': [('Pollution', 'Dyspnoea'),\n",
       "    ('Pollution', 'Xray'),\n",
       "    ('Smoker', 'Xray'),\n",
       "    ('Smoker', 'Dyspnoea')],\n",
       "   'reversed_indirect_paths': [('Dyspnoea', 'Pollution')],\n",
       "   'no_connections': [('Xray', 'Dyspnoea')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'B': {'direct_edges': [],\n",
       "   'reversed_edges': [('Cancer', 'Smoker'),\n",
       "    ('Cancer', 'Pollution'),\n",
       "    ('Dyspnoea', 'Cancer')],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [('Pollution', 'Smoker'), ('Xray', 'Dyspnoea')],\n",
       "   'common_parents': [('Pollution', 'Smoker')],\n",
       "   'common_childs': [('Pollution', 'Smoker')]},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []}},\n",
       " 'water': {'A': {'direct_edges': [('C_NI_12_00', 'C_NI_12_15'),\n",
       "    ('CKNI_12_00', 'CKNI_12_15'),\n",
       "    ('CKNI_12_00', 'CBODD_12_15'),\n",
       "    ('CKND_12_00', 'CKND_12_15'),\n",
       "    ('CKND_12_00', 'CKNN_12_15'),\n",
       "    ('CNOD_12_00', 'CNON_12_15'),\n",
       "    ('C_NI_12_15', 'C_NI_12_30'),\n",
       "    ('CKNI_12_15', 'CKNI_12_30'),\n",
       "    ('CKNI_12_15', 'CBODD_12_30'),\n",
       "    ('CBODD_12_15', 'CBODD_12_30'),\n",
       "    ('CKNN_12_15', 'CKNN_12_30'),\n",
       "    ('CKNN_12_15', 'CNON_12_30'),\n",
       "    ('CNON_12_15', 'CNON_12_30'),\n",
       "    ('C_NI_12_30', 'C_NI_12_45'),\n",
       "    ('CKNI_12_30', 'CKNI_12_45'),\n",
       "    ('CBODD_12_30', 'CBODD_12_45'),\n",
       "    ('CKND_12_30', 'CKNN_12_45'),\n",
       "    ('CKNN_12_30', 'CKNN_12_45'),\n",
       "    ('CKNN_12_30', 'CNON_12_45'),\n",
       "    ('CNON_12_30', 'CNON_12_45'),\n",
       "    ('CBODN_12_00', 'CBODN_12_15'),\n",
       "    ('CKNN_12_00', 'CKND_12_15'),\n",
       "    ('CKNN_12_00', 'CKNN_12_15'),\n",
       "    ('CKND_12_15', 'CKND_12_30'),\n",
       "    ('CBODN_12_15', 'CBODN_12_30'),\n",
       "    ('CKND_12_30', 'CKND_12_45'),\n",
       "    ('CBODN_12_30', 'CBODN_12_45'),\n",
       "    ('CBODN_12_00', 'CNON_12_15'),\n",
       "    ('CBODD_12_30', 'CBODN_12_45'),\n",
       "    ('CNON_12_00', 'CNON_12_15'),\n",
       "    ('C_NI_12_00', 'CBODD_12_15'),\n",
       "    ('CNON_12_00', 'CBODN_12_15'),\n",
       "    ('CNON_12_00', 'CNOD_12_15'),\n",
       "    ('CBODD_12_00', 'CBODN_12_15'),\n",
       "    ('CKND_12_15', 'CKNN_12_30'),\n",
       "    ('CNOD_12_00', 'CNOD_12_15'),\n",
       "    ('CNON_12_15', 'CNOD_12_30'),\n",
       "    ('CKNI_12_15', 'CKND_12_30'),\n",
       "    ('CKNI_12_30', 'CBODD_12_45'),\n",
       "    ('CNON_12_30', 'CNOD_12_45'),\n",
       "    ('CBODD_12_15', 'CBODN_12_30'),\n",
       "    ('CBODD_12_30', 'CNOD_12_45'),\n",
       "    ('CBODD_12_00', 'CNOD_12_15'),\n",
       "    ('CNOD_12_30', 'CNON_12_45'),\n",
       "    ('CNON_12_15', 'CBODN_12_30'),\n",
       "    ('CKNI_12_00', 'CKND_12_15'),\n",
       "    ('CNOD_12_00', 'CBODD_12_15'),\n",
       "    ('CNOD_12_15', 'CNON_12_30'),\n",
       "    ('CBODN_12_15', 'CNON_12_30'),\n",
       "    ('CKNN_12_15', 'CKND_12_30'),\n",
       "    ('CNOD_12_30', 'CBODD_12_45'),\n",
       "    ('CKNN_12_30', 'CKND_12_45'),\n",
       "    ('CNON_12_30', 'CBODN_12_45')],\n",
       "   'reversed_edges': [('CBODN_12_15', 'CBODN_12_00'),\n",
       "    ('CKND_12_30', 'CKND_12_15'),\n",
       "    ('CNOD_12_30', 'CNOD_12_15'),\n",
       "    ('CBODN_12_30', 'CBODN_12_15'),\n",
       "    ('CKND_12_45', 'CKND_12_30'),\n",
       "    ('CNOD_12_45', 'CNOD_12_30'),\n",
       "    ('CBODN_12_45', 'CBODN_12_30'),\n",
       "    ('CBODN_12_15', 'CBODD_12_00'),\n",
       "    ('CKND_12_45', 'CKNI_12_30'),\n",
       "    ('CKND_12_15', 'CKNI_12_00'),\n",
       "    ('CBODD_12_15', 'C_NI_12_00'),\n",
       "    ('CBODN_12_15', 'CNON_12_00'),\n",
       "    ('CBODD_12_30', 'C_NI_12_15'),\n",
       "    ('CNON_12_45', 'CNOD_12_30'),\n",
       "    ('CBODN_12_30', 'CNON_12_15')],\n",
       "   'indirect_paths': [('CKND_12_15', 'CKND_12_45'),\n",
       "    ('CNON_12_15', 'CNON_12_45'),\n",
       "    ('C_NI_12_00', 'CNOD_12_45'),\n",
       "    ('CKNI_12_00', 'CBODD_12_45'),\n",
       "    ('CBODD_12_00', 'CNOD_12_30'),\n",
       "    ('CBODN_12_00', 'CNON_12_45'),\n",
       "    ('CKNN_12_00', 'CBODN_12_30'),\n",
       "    ('CKNN_12_00', 'CNOD_12_45'),\n",
       "    ('CNON_12_00', 'CBODD_12_30'),\n",
       "    ('CNON_12_00', 'CNON_12_30'),\n",
       "    ('C_NI_12_15', 'CNOD_12_45'),\n",
       "    ('CKNN_12_15', 'CNOD_12_45')],\n",
       "   'reversed_indirect_paths': [('C_NI_12_30', 'C_NI_12_00')],\n",
       "   'no_connections': [('CKND_12_00', 'CNOD_12_15'),\n",
       "    ('CBODN_12_00', 'CNOD_12_15'),\n",
       "    ('CNOD_12_00', 'CBODN_12_15'),\n",
       "    ('CKNN_12_00', 'CBODN_12_15'),\n",
       "    ('CKND_12_00', 'CBODN_12_15'),\n",
       "    ('CKNN_12_00', 'CNOD_12_15'),\n",
       "    ('CBODD_12_00', 'CNON_12_15'),\n",
       "    ('CNON_12_30', 'CKND_12_45'),\n",
       "    ('C_NI_12_15', 'CBODN_12_30'),\n",
       "    ('CBODN_12_30', 'CKND_12_45'),\n",
       "    ('CNOD_12_00', 'CKND_12_15'),\n",
       "    ('CNON_12_00', 'CKND_12_15'),\n",
       "    ('CBODN_12_00', 'CKND_12_15'),\n",
       "    ('CKND_12_15', 'CBODD_12_00'),\n",
       "    ('CKND_12_15', 'CNOD_12_30'),\n",
       "    ('CNON_12_15', 'CKNN_12_30'),\n",
       "    ('CBODD_12_15', 'CKNI_12_30'),\n",
       "    ('CKND_12_30', 'CBODN_12_45'),\n",
       "    ('CBODD_12_00', 'CKND_12_15'),\n",
       "    ('CNOD_12_00', 'CKNN_12_15'),\n",
       "    ('CKNN_12_30', 'CNOD_12_45'),\n",
       "    ('CKND_12_00', 'CNON_12_15'),\n",
       "    ('CNON_12_15', 'CKND_12_30'),\n",
       "    ('CBODD_12_00', 'CKNI_12_15'),\n",
       "    ('CBODD_12_00', 'CKNN_12_30'),\n",
       "    ('CNON_12_00', 'CKNI_12_15'),\n",
       "    ('CNOD_12_15', 'CKNI_12_30'),\n",
       "    ('CBODN_12_15', 'CKNI_12_45'),\n",
       "    ('CKNN_12_15', 'C_NI_12_30'),\n",
       "    ('CKNN_12_15', 'CNOD_12_30'),\n",
       "    ('CBODD_12_30', 'CKNI_12_45'),\n",
       "    ('CNON_12_30', 'CKNN_12_45')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'B': {'direct_edges': [('CBODN_12_30', 'CNON_12_45')],\n",
       "   'reversed_edges': [('CBODD_12_15', 'CKNI_12_00'),\n",
       "    ('CKNI_12_15', 'CKNI_12_00'),\n",
       "    ('CBODD_12_30', 'CBODD_12_15'),\n",
       "    ('C_NI_12_15', 'C_NI_12_00'),\n",
       "    ('CKNI_12_30', 'CKNI_12_15'),\n",
       "    ('CBODD_12_45', 'CBODD_12_30'),\n",
       "    ('CKNN_12_30', 'CKNN_12_15'),\n",
       "    ('CNON_12_15', 'CNON_12_00'),\n",
       "    ('CKNN_12_45', 'CKNN_12_30'),\n",
       "    ('CKND_12_15', 'CKND_12_00'),\n",
       "    ('CKND_12_30', 'CKNI_12_15'),\n",
       "    ('CNON_12_15', 'CNOD_12_00'),\n",
       "    ('CNON_12_30', 'CNON_12_15'),\n",
       "    ('CBODD_12_30', 'CKNI_12_15'),\n",
       "    ('C_NI_12_30', 'C_NI_12_15'),\n",
       "    ('CKNI_12_45', 'CKNI_12_30'),\n",
       "    ('CBODD_12_45', 'C_NI_12_30'),\n",
       "    ('CNON_12_45', 'CNON_12_30')],\n",
       "   'indirect_paths': [('CKNI_12_00', 'CKNI_12_45'),\n",
       "    ('CKNI_12_00', 'CKND_12_45'),\n",
       "    ('CBODD_12_00', 'CBODN_12_45'),\n",
       "    ('CBODN_12_00', 'CBODD_12_45'),\n",
       "    ('CNON_12_00', 'CNOD_12_45'),\n",
       "    ('C_NI_12_15', 'C_NI_12_45'),\n",
       "    ('CKNN_12_15', 'CBODN_12_45'),\n",
       "    ('CNON_12_15', 'CBODD_12_45'),\n",
       "    ('CNON_12_15', 'CNOD_12_45'),\n",
       "    ('CNON_12_15', 'CBODN_12_45')],\n",
       "   'reversed_indirect_paths': [('CNOD_12_30', 'CNON_12_00')],\n",
       "   'no_connections': [('CNON_12_15', 'CKNI_12_00'),\n",
       "    ('CKND_12_30', 'CNOD_12_00'),\n",
       "    ('CKND_12_15', 'CNOD_12_00'),\n",
       "    ('CNOD_12_00', 'CKNN_12_45'),\n",
       "    ('CNON_12_15', 'CKNN_12_45')],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []},\n",
       "  'C': {'direct_edges': [],\n",
       "   'reversed_edges': [('CNOD_12_15', 'CBODD_12_00'),\n",
       "    ('CKND_12_45', 'CKNN_12_30'),\n",
       "    ('CNON_12_30', 'CNOD_12_15'),\n",
       "    ('CKND_12_30', 'CKNN_12_15')],\n",
       "   'indirect_paths': [('CNON_12_00', 'CNOD_12_45'),\n",
       "    ('CBODD_12_15', 'CBODN_12_45'),\n",
       "    ('CBODN_12_00', 'CNOD_12_45'),\n",
       "    ('CKND_12_00', 'CKND_12_30'),\n",
       "    ('CNOD_12_00', 'CNOD_12_45'),\n",
       "    ('CBODD_12_00', 'CNOD_12_45'),\n",
       "    ('CKNN_12_00', 'CNOD_12_45'),\n",
       "    ('CKNI_12_15', 'CBODD_12_45'),\n",
       "    ('CKNN_12_00', 'CNOD_12_30'),\n",
       "    ('CKND_12_00', 'CNOD_12_45'),\n",
       "    ('CNON_12_00', 'CNOD_12_30'),\n",
       "    ('CNOD_12_00', 'CNOD_12_30'),\n",
       "    ('CBODD_12_00', 'CNOD_12_30'),\n",
       "    ('CBODN_12_00', 'CNOD_12_30'),\n",
       "    ('CKNI_12_00', 'CKND_12_30'),\n",
       "    ('CKND_12_00', 'CKND_12_45'),\n",
       "    ('CKND_12_15', 'CKNN_12_45'),\n",
       "    ('CKNN_12_15', 'CKNN_12_45'),\n",
       "    ('CKNN_12_00', 'CKND_12_45'),\n",
       "    ('CKNN_12_00', 'CKND_12_30'),\n",
       "    ('CBODN_12_15', 'CNOD_12_45'),\n",
       "    ('CKNI_12_15', 'CKND_12_45'),\n",
       "    ('CKNN_12_00', 'CBODN_12_45'),\n",
       "    ('CKND_12_00', 'CBODN_12_45'),\n",
       "    ('CNON_12_15', 'CNOD_12_45'),\n",
       "    ('CBODD_12_15', 'CNOD_12_45'),\n",
       "    ('CKNI_12_00', 'CNOD_12_30')],\n",
       "   'reversed_indirect_paths': [('CBODD_12_30', 'C_NI_12_00'),\n",
       "    ('CKND_12_30', 'CKNI_12_00'),\n",
       "    ('CBODN_12_45', 'CBODN_12_15'),\n",
       "    ('CKND_12_30', 'CKNN_12_00'),\n",
       "    ('CBODD_12_45', 'C_NI_12_15'),\n",
       "    ('CBODD_12_45', 'C_NI_12_00'),\n",
       "    ('CBODN_12_30', 'CKNN_12_00'),\n",
       "    ('CKND_12_45', 'CKND_12_00'),\n",
       "    ('CNOD_12_45', 'CNOD_12_15'),\n",
       "    ('CKND_12_30', 'CKND_12_00'),\n",
       "    ('CBODN_12_30', 'CNON_12_00'),\n",
       "    ('CBODD_12_45', 'CKNI_12_15'),\n",
       "    ('CNON_12_45', 'CKNN_12_15'),\n",
       "    ('CBODN_12_45', 'CBODD_12_15'),\n",
       "    ('CBODD_12_30', 'CKNI_12_00'),\n",
       "    ('CKND_12_45', 'CKNN_12_15'),\n",
       "    ('CNON_12_45', 'CNOD_12_15')],\n",
       "   'no_connections': [('CNON_12_00', 'CBODD_12_00'),\n",
       "    ('CKND_12_00', 'CBODD_12_00'),\n",
       "    ('CKNN_12_00', 'CNOD_12_00'),\n",
       "    ('CKND_12_00', 'CBODN_12_00'),\n",
       "    ('CBODD_12_00', 'CBODN_12_00'),\n",
       "    ('CKNN_12_00', 'CBODD_12_00'),\n",
       "    ('CBODD_12_00', 'CNOD_12_00'),\n",
       "    ('CBODD_12_00', 'CNON_12_00'),\n",
       "    ('CNOD_12_00', 'CKND_12_30'),\n",
       "    ('CKND_12_30', 'CBODN_12_00'),\n",
       "    ('CKND_12_00', 'CNOD_12_30'),\n",
       "    ('CNON_12_15', 'CNOD_12_15'),\n",
       "    ('CKND_12_00', 'CKNN_12_00'),\n",
       "    ('CNON_12_00', 'CKND_12_45'),\n",
       "    ('CBODN_12_00', 'CKND_12_45'),\n",
       "    ('CNON_12_00', 'CKND_12_30'),\n",
       "    ('CNOD_12_00', 'CKND_12_45'),\n",
       "    ('CBODD_12_00', 'CKND_12_30'),\n",
       "    ('CBODD_12_00', 'CKND_12_45'),\n",
       "    ('CBODN_12_00', 'CKND_12_30'),\n",
       "    ('CKND_12_15', 'CNON_12_15'),\n",
       "    ('CKNI_12_45', 'CKND_12_45'),\n",
       "    ('CBODN_12_45', 'CKND_12_45'),\n",
       "    ('CNON_12_45', 'CNOD_12_45'),\n",
       "    ('CNON_12_15', 'CKNN_12_15'),\n",
       "    ('CBODD_12_30', 'CKNI_12_30'),\n",
       "    ('CBODD_12_15', 'CKNI_12_15'),\n",
       "    ('CBODD_12_45', 'CBODN_12_45'),\n",
       "    ('CKND_12_15', 'CKNN_12_15'),\n",
       "    ('CKND_12_30', 'CNOD_12_30'),\n",
       "    ('CKNN_12_30', 'CNOD_12_30'),\n",
       "    ('CNON_12_30', 'CKNN_12_30'),\n",
       "    ('CNON_12_30', 'CNOD_12_30'),\n",
       "    ('CBODD_12_15', 'C_NI_12_15'),\n",
       "    ('CKND_12_30', 'CBODD_12_00'),\n",
       "    ('CKND_12_30', 'CNON_12_00'),\n",
       "    ('CNON_12_15', 'CBODD_12_00'),\n",
       "    ('CBODN_12_15', 'CKNN_12_00'),\n",
       "    ('CKND_12_45', 'CBODN_12_30'),\n",
       "    ('CBODD_12_30', 'CNOD_12_30'),\n",
       "    ('CBODD_12_15', 'CKNN_12_00'),\n",
       "    ('CKND_12_30', 'CKNN_12_30')],\n",
       "   'common_parents': [('CNON_12_00', 'CBODD_12_00'),\n",
       "    ('CKNN_12_00', 'CNOD_12_00'),\n",
       "    ('CBODD_12_00', 'CBODN_12_00'),\n",
       "    ('CBODD_12_00', 'CNOD_12_00'),\n",
       "    ('CBODD_12_00', 'CNON_12_00'),\n",
       "    ('CNON_12_15', 'CNOD_12_15'),\n",
       "    ('CKND_12_00', 'CKNN_12_00'),\n",
       "    ('CNON_12_15', 'CKNN_12_15'),\n",
       "    ('CBODD_12_30', 'CKNI_12_30'),\n",
       "    ('CBODD_12_15', 'CKNI_12_15'),\n",
       "    ('CKND_12_15', 'CKNN_12_15'),\n",
       "    ('CKNN_12_30', 'CNOD_12_30'),\n",
       "    ('CNON_12_30', 'CKNN_12_30'),\n",
       "    ('CNON_12_30', 'CNOD_12_30'),\n",
       "    ('CBODD_12_15', 'C_NI_12_15'),\n",
       "    ('CBODD_12_30', 'CNOD_12_30'),\n",
       "    ('CKND_12_30', 'CKNN_12_30')],\n",
       "   'common_childs': [('CNON_12_00', 'CBODD_12_00'),\n",
       "    ('CKNN_12_00', 'CNOD_12_00'),\n",
       "    ('CBODD_12_00', 'CBODN_12_00'),\n",
       "    ('CBODD_12_00', 'CNOD_12_00'),\n",
       "    ('CBODD_12_00', 'CNON_12_00'),\n",
       "    ('CNON_12_15', 'CNOD_12_15'),\n",
       "    ('CKND_12_00', 'CKNN_12_00'),\n",
       "    ('CNON_12_15', 'CKNN_12_15'),\n",
       "    ('CBODD_12_30', 'CKNI_12_30'),\n",
       "    ('CBODD_12_15', 'CKNI_12_15'),\n",
       "    ('CKND_12_15', 'CKNN_12_15'),\n",
       "    ('CKNN_12_30', 'CNOD_12_30'),\n",
       "    ('CNON_12_30', 'CKNN_12_30'),\n",
       "    ('CNON_12_30', 'CNOD_12_30'),\n",
       "    ('CBODD_12_15', 'C_NI_12_15'),\n",
       "    ('CBODD_12_30', 'CNOD_12_30'),\n",
       "    ('CKND_12_30', 'CKNN_12_30')]}},\n",
       " 'barley': {'A': {'direct_edges': [('jordtype', 'potnmin'),\n",
       "    ('jordtype', 'exptgens'),\n",
       "    ('jordtype', 'rokap'),\n",
       "    ('nmin', 'jordn'),\n",
       "    ('nmin', 'mod_nmin'),\n",
       "    ('aar_mod', 'jordn'),\n",
       "    ('aar_mod', 'mod_nmin'),\n",
       "    ('forfrugt', 'ngodnt'),\n",
       "    ('potnmin', 'jordn'),\n",
       "    ('jordn', 'ngodnn'),\n",
       "    ('jordn', 'nprot'),\n",
       "    ('jordn', 'ntilg'),\n",
       "    ('exptgens', 'ngodnt'),\n",
       "    ('exptgens', 'nopt'),\n",
       "    ('mod_nmin', 'ngodnt'),\n",
       "    ('nopt', 'ngodnn'),\n",
       "    ('ngodn', 'nprot'),\n",
       "    ('ngodn', 'ngtilg'),\n",
       "    ('saatid', 'dg25'),\n",
       "    ('saatid', 'frspdag'),\n",
       "    ('sort', 'srtprot'),\n",
       "    ('sort', 'sorttkv'),\n",
       "    ('nplac', 'ngtilg'),\n",
       "    ('saamng', 'saakern'),\n",
       "    ('saakern', 'antplnt'),\n",
       "    ('partigerm', 'markgrm'),\n",
       "    ('frspdag', 'jordinf'),\n",
       "    ('jordinf', 'markgrm'),\n",
       "    ('markgrm', 'antplnt'),\n",
       "    ('aks_m2', 'udb'),\n",
       "    ('aks_vgt', 'udb'),\n",
       "    ('jordtype', 'nmin'),\n",
       "    ('forfrugt', 'potnmin'),\n",
       "    ('sort', 'srtsize'),\n",
       "    ('nedbarea', 'nmin'),\n",
       "    ('keraks', 'ksort'),\n",
       "    ('aks_vgt', 'ksort'),\n",
       "    ('nprot', 'protein'),\n",
       "    ('forfrugt', 'exptgens'),\n",
       "    ('srtprot', 'protein'),\n",
       "    ('ntilg', 'aks_m2'),\n",
       "    ('jordtype', 'aar_mod'),\n",
       "    ('ntilg', 'keraks'),\n",
       "    ('tkvs', 'saakern')],\n",
       "   'reversed_edges': [('nmin', 'jordtype'),\n",
       "    ('nmin', 'nedbarea'),\n",
       "    ('potnmin', 'forfrugt'),\n",
       "    ('srtsize', 'sort'),\n",
       "    ('jordn', 'nmin'),\n",
       "    ('mod_nmin', 'aar_mod'),\n",
       "    ('nopt', 'exptgens'),\n",
       "    ('saakern', 'tkvs'),\n",
       "    ('antplnt', 'saakern'),\n",
       "    ('antplnt', 'markgrm'),\n",
       "    ('aks_vgt', 'aks_m2'),\n",
       "    ('jordn', 'potnmin'),\n",
       "    ('jordinf', 'frspdag'),\n",
       "    ('aks_m2', 'antplnt'),\n",
       "    ('exptgens', 'forfrugt'),\n",
       "    ('ngodnn', 'nopt'),\n",
       "    ('ngtilg', 'ngodn'),\n",
       "    ('ngodn', 'ngodnt'),\n",
       "    ('protein', 'srtprot'),\n",
       "    ('nopt', 'pesticid'),\n",
       "    ('ngtilg', 'dg25'),\n",
       "    ('jordn', 'aar_mod'),\n",
       "    ('ngodnt', 'exptgens'),\n",
       "    ('aks_m2', 'sorttkv'),\n",
       "    ('potnmin', 'jordtype')],\n",
       "   'indirect_paths': [('jordtype', 'mod_nmin'),\n",
       "    ('pesticid', 'ngodn'),\n",
       "    ('nmin', 'ngodnn'),\n",
       "    ('nopt', 'nprot'),\n",
       "    ('jordtype', 'nprot'),\n",
       "    ('nmin', 'nprot'),\n",
       "    ('mod_nmin', 'nprot'),\n",
       "    ('ntilg', 'udb'),\n",
       "    ('forfrugt', 'jordn'),\n",
       "    ('jordn', 'ngodn'),\n",
       "    ('nopt', 'ngodn'),\n",
       "    ('nmin', 'aks_m2'),\n",
       "    ('mod_nmin', 'ngodn'),\n",
       "    ('nmin', 'ngodn'),\n",
       "    ('nmin', 'ngtilg'),\n",
       "    ('rokap', 'keraks'),\n",
       "    ('potnmin', 'nprot'),\n",
       "    ('nplac', 'udb'),\n",
       "    ('nmin', 'ngodnt'),\n",
       "    ('saamng', 'antplnt'),\n",
       "    ('jordtype', 'jordn'),\n",
       "    ('jordn', 'ngtilg'),\n",
       "    ('ngodnn', 'ntilg'),\n",
       "    ('frspdag', 'markgrm'),\n",
       "    ('rokap', 'ksort'),\n",
       "    ('saatid', 'jordinf'),\n",
       "    ('ngodnn', 'ngtilg'),\n",
       "    ('potnmin', 'ngodnn'),\n",
       "    ('saatid', 'ksort'),\n",
       "    ('nopt', 'ntilg'),\n",
       "    ('nopt', 'keraks'),\n",
       "    ('jordinf', 'antplnt'),\n",
       "    ('nplac', 'ntilg'),\n",
       "    ('rokap', 'aks_m2'),\n",
       "    ('nmin', 'keraks'),\n",
       "    ('nmin', 'ntilg'),\n",
       "    ('exptgens', 'ngodnn'),\n",
       "    ('forfrugt', 'nprot'),\n",
       "    ('aks_m2', 'ksort'),\n",
       "    ('ngodnt', 'ngtilg'),\n",
       "    ('jordn', 'protein'),\n",
       "    ('jordn', 'aks_m2'),\n",
       "    ('jordtype', 'ngodnt'),\n",
       "    ('nedbarea', 'ksort'),\n",
       "    ('aar_mod', 'ngtilg'),\n",
       "    ('nplac', 'protein'),\n",
       "    ('frspdag', 'ksort')],\n",
       "   'reversed_indirect_paths': [('ngodn', 'jordn'),\n",
       "    ('aks_m2', 'nmin'),\n",
       "    ('ntilg', 'nplac'),\n",
       "    ('aks_m2', 'saakern'),\n",
       "    ('nprot', 'jordtype'),\n",
       "    ('ngtilg', 'ngodnn'),\n",
       "    ('ngodn', 'aar_mod'),\n",
       "    ('udb', 'nplac'),\n",
       "    ('antplnt', 'tkvs'),\n",
       "    ('ksort', 'saatid'),\n",
       "    ('antplnt', 'partigerm'),\n",
       "    ('udb', 'jordn'),\n",
       "    ('keraks', 'ngodn'),\n",
       "    ('antplnt', 'jordinf'),\n",
       "    ('ksort', 'aks_m2'),\n",
       "    ('udb', 'ntilg'),\n",
       "    ('ngodn', 'exptgens'),\n",
       "    ('ngodn', 'nopt'),\n",
       "    ('aks_vgt', 'saakern'),\n",
       "    ('udb', 'ngodn'),\n",
       "    ('ntilg', 'dg25'),\n",
       "    ('keraks', 'rokap'),\n",
       "    ('keraks', 'exptgens'),\n",
       "    ('nprot', 'ngodnt')],\n",
       "   'no_connections': [('nmin', 'aar_mod'),\n",
       "    ('saamng', 'tkvs'),\n",
       "    ('jordinf', 'partigerm'),\n",
       "    ('nmin', 'potnmin'),\n",
       "    ('pesticid', 'mod_nmin'),\n",
       "    ('pesticid', 'saakern'),\n",
       "    ('pesticid', 'antplnt'),\n",
       "    ('jordtype', 'forfrugt'),\n",
       "    ('mod_nmin', 'potnmin'),\n",
       "    ('saakern', 'markgrm'),\n",
       "    ('aks_vgt', 'keraks'),\n",
       "    ('potnmin', 'mod_nmin'),\n",
       "    ('jordn', 'mod_nmin'),\n",
       "    ('mod_nmin', 'forfrugt'),\n",
       "    ('jordn', 'nopt'),\n",
       "    ('exptgens', 'mod_nmin'),\n",
       "    ('jordtype', 'nedbarea'),\n",
       "    ('potnmin', 'nmin'),\n",
       "    ('forfrugt', 'mod_nmin'),\n",
       "    ('aar_mod', 'potnmin'),\n",
       "    ('saatid', 'rokap'),\n",
       "    ('rokap', 'nprot'),\n",
       "    ('srtsize', 'aks_vgt'),\n",
       "    ('ngodn', 'dg25'),\n",
       "    ('exptgens', 'jordn'),\n",
       "    ('nmin', 'exptgens'),\n",
       "    ('nmin', 'rokap'),\n",
       "    ('potnmin', 'aar_mod'),\n",
       "    ('exptgens', 'rokap'),\n",
       "    ('srtsize', 'srtprot'),\n",
       "    ('nopt', 'rokap'),\n",
       "    ('nprot', 'udb'),\n",
       "    ('aar_mod', 'nmin'),\n",
       "    ('rokap', 'exptgens'),\n",
       "    ('nmin', 'forfrugt'),\n",
       "    ('mod_nmin', 'exptgens'),\n",
       "    ('exptgens', 'nmin'),\n",
       "    ('saatid', 'jordtype'),\n",
       "    ('jordn', 'ngodnt'),\n",
       "    ('ksort', 'udb'),\n",
       "    ('saamng', 'markgrm'),\n",
       "    ('srtsize', 'sorttkv'),\n",
       "    ('ngtilg', 'nprot'),\n",
       "    ('jordn', 'exptgens'),\n",
       "    ('nprot', 'aks_m2'),\n",
       "    ('nopt', 'mod_nmin'),\n",
       "    ('forfrugt', 'jordtype'),\n",
       "    ('ntilg', 'nprot'),\n",
       "    ('saamng', 'partigerm'),\n",
       "    ('mod_nmin', 'ngodnn'),\n",
       "    ('srtsize', 'keraks'),\n",
       "    ('nprot', 'ngtilg'),\n",
       "    ('exptgens', 'potnmin'),\n",
       "    ('mod_nmin', 'nopt'),\n",
       "    ('nplac', 'ngodnn'),\n",
       "    ('nmin', 'nopt'),\n",
       "    ('srtprot', 'srtsize'),\n",
       "    ('partigerm', 'frspdag'),\n",
       "    ('nedbarea', 'srtprot'),\n",
       "    ('pesticid', 'saakern'),\n",
       "    ('nopt', 'antplnt'),\n",
       "    ('rokap', 'markgrm')],\n",
       "   'common_parents': [('nmin', 'aar_mod'),\n",
       "    ('saamng', 'tkvs'),\n",
       "    ('jordinf', 'partigerm'),\n",
       "    ('nmin', 'potnmin'),\n",
       "    ('jordtype', 'forfrugt'),\n",
       "    ('saakern', 'markgrm'),\n",
       "    ('aks_vgt', 'keraks'),\n",
       "    ('mod_nmin', 'forfrugt'),\n",
       "    ('jordn', 'nopt'),\n",
       "    ('exptgens', 'mod_nmin'),\n",
       "    ('jordtype', 'nedbarea'),\n",
       "    ('potnmin', 'nmin'),\n",
       "    ('forfrugt', 'mod_nmin'),\n",
       "    ('aar_mod', 'potnmin'),\n",
       "    ('saatid', 'rokap'),\n",
       "    ('srtsize', 'aks_vgt'),\n",
       "    ('ngodn', 'dg25'),\n",
       "    ('potnmin', 'aar_mod'),\n",
       "    ('aar_mod', 'nmin'),\n",
       "    ('mod_nmin', 'exptgens'),\n",
       "    ('forfrugt', 'jordtype'),\n",
       "    ('srtsize', 'keraks')],\n",
       "   'common_childs': [('nmin', 'aar_mod'),\n",
       "    ('saamng', 'tkvs'),\n",
       "    ('jordinf', 'partigerm'),\n",
       "    ('nmin', 'potnmin'),\n",
       "    ('jordtype', 'forfrugt'),\n",
       "    ('saakern', 'markgrm'),\n",
       "    ('aks_vgt', 'keraks'),\n",
       "    ('mod_nmin', 'forfrugt'),\n",
       "    ('jordn', 'nopt'),\n",
       "    ('exptgens', 'mod_nmin'),\n",
       "    ('jordtype', 'nedbarea'),\n",
       "    ('potnmin', 'nmin'),\n",
       "    ('forfrugt', 'mod_nmin'),\n",
       "    ('aar_mod', 'potnmin'),\n",
       "    ('saatid', 'rokap'),\n",
       "    ('srtsize', 'aks_vgt'),\n",
       "    ('ngodn', 'dg25'),\n",
       "    ('potnmin', 'aar_mod'),\n",
       "    ('aar_mod', 'nmin'),\n",
       "    ('mod_nmin', 'exptgens'),\n",
       "    ('forfrugt', 'jordtype'),\n",
       "    ('srtsize', 'keraks')]},\n",
       "  'B': {'direct_edges': [('ntilg', 'aks_vgt'), ('pesticid', 'nopt')],\n",
       "   'reversed_edges': [('exptgens', 'jordtype'),\n",
       "    ('srtprot', 'sort'),\n",
       "    ('saakern', 'saamng'),\n",
       "    ('frspdag', 'saatid'),\n",
       "    ('markgrm', 'partigerm'),\n",
       "    ('markgrm', 'jordinf'),\n",
       "    ('udb', 'aks_m2'),\n",
       "    ('udb', 'aks_vgt'),\n",
       "    ('rokap', 'jordtype'),\n",
       "    ('ngtilg', 'nplac'),\n",
       "    ('ngodnn', 'jordn'),\n",
       "    ('ngodnt', 'forfrugt'),\n",
       "    ('mod_nmin', 'nmin'),\n",
       "    ('ksort', 'aks_vgt'),\n",
       "    ('sorttkv', 'sort'),\n",
       "    ('ngodnt', 'mod_nmin'),\n",
       "    ('dg25', 'saatid'),\n",
       "    ('ntilg', 'jordn')],\n",
       "   'indirect_paths': [('exptgens', 'aks_m2'),\n",
       "    ('komm', 'jordn'),\n",
       "    ('komm', 'aks_m2'),\n",
       "    ('pesticid', 'keraks'),\n",
       "    ('pesticid', 'ksort'),\n",
       "    ('partigerm', 'udb'),\n",
       "    ('jordinf', 'aks_vgt')],\n",
       "   'reversed_indirect_paths': [('ngodn', 'mod_nmin'),\n",
       "    ('aks_m2', 'saatid'),\n",
       "    ('ngodn', 'jordtype'),\n",
       "    ('aks_m2', 'saamng'),\n",
       "    ('keraks', 'jordtype'),\n",
       "    ('antplnt', 'saamng'),\n",
       "    ('keraks', 'potnmin'),\n",
       "    ('nopt', 'jordtype'),\n",
       "    ('ngodn', 'nmin'),\n",
       "    ('ngodnt', 'nmin'),\n",
       "    ('ngodn', 'forfrugt'),\n",
       "    ('nprot', 'potnmin'),\n",
       "    ('nprot', 'nmin'),\n",
       "    ('ngodnn', 'nmin'),\n",
       "    ('ngtilg', 'jordn'),\n",
       "    ('ngtilg', 'nopt'),\n",
       "    ('jordinf', 'saatid'),\n",
       "    ('keraks', 'jordn'),\n",
       "    ('jordn', 'jordtype'),\n",
       "    ('keraks', 'nmin'),\n",
       "    ('ngodnn', 'exptgens'),\n",
       "    ('nprot', 'exptgens'),\n",
       "    ('ngodnn', 'jordtype'),\n",
       "    ('ngodnt', 'nedbarea'),\n",
       "    ('keraks', 'nopt'),\n",
       "    ('ntilg', 'nopt'),\n",
       "    ('udb', 'mod_nmin'),\n",
       "    ('udb', 'nopt'),\n",
       "    ('udb', 'potnmin'),\n",
       "    ('ngtilg', 'mod_nmin'),\n",
       "    ('ksort', 'jordtype'),\n",
       "    ('ntilg', 'potnmin'),\n",
       "    ('ntilg', 'mod_nmin'),\n",
       "    ('protein', 'ngtilg'),\n",
       "    ('keraks', 'mod_nmin'),\n",
       "    ('udb', 'exptgens')],\n",
       "   'no_connections': [('ngodn', 'nplac'),\n",
       "    ('partigerm', 'jordinf'),\n",
       "    ('keraks', 'aks_vgt'),\n",
       "    ('nopt', 'jordn'),\n",
       "    ('ngodn', 'rokap'),\n",
       "    ('exptgens', 'aar_mod'),\n",
       "    ('rokap', 'saatid'),\n",
       "    ('saakern', 'partigerm'),\n",
       "    ('saakern', 'jordinf'),\n",
       "    ('nprot', 'nplac'),\n",
       "    ('nopt', 'potnmin'),\n",
       "    ('nopt', 'nplac'),\n",
       "    ('ngodnt', 'nopt'),\n",
       "    ('ngodnt', 'nplac'),\n",
       "    ('keraks', 'srtsize'),\n",
       "    ('jordtype', 'nedbarea'),\n",
       "    ('nmin', 'saatid'),\n",
       "    ('potnmin', 'jordinf'),\n",
       "    ('jordn', 'pesticid'),\n",
       "    ('ngodnn', 'jordinf'),\n",
       "    ('nprot', 'saatid')],\n",
       "   'common_parents': [('ngodn', 'nplac'),\n",
       "    ('partigerm', 'jordinf'),\n",
       "    ('keraks', 'aks_vgt'),\n",
       "    ('nopt', 'jordn'),\n",
       "    ('rokap', 'saatid'),\n",
       "    ('keraks', 'srtsize'),\n",
       "    ('jordtype', 'nedbarea')],\n",
       "   'common_childs': [('ngodn', 'nplac'),\n",
       "    ('partigerm', 'jordinf'),\n",
       "    ('keraks', 'aks_vgt'),\n",
       "    ('nopt', 'jordn'),\n",
       "    ('rokap', 'saatid'),\n",
       "    ('keraks', 'srtsize'),\n",
       "    ('jordtype', 'nedbarea')]},\n",
       "  'C': {'direct_edges': [('pesticid', 'nopt')],\n",
       "   'reversed_edges': [],\n",
       "   'indirect_paths': [],\n",
       "   'reversed_indirect_paths': [],\n",
       "   'no_connections': [],\n",
       "   'common_parents': [],\n",
       "   'common_childs': []}}}"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "answer_type_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'A': {'direct_edges': 44,\n",
       "   'reversed_edges': 2,\n",
       "   'indirect_paths': 37,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 49,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 7},\n",
       "  'B': {'direct_edges': 1,\n",
       "   'reversed_edges': 22,\n",
       "   'indirect_paths': 6,\n",
       "   'reversed_indirect_paths': 11,\n",
       "   'no_connections': 21,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 3},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 0,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 3,\n",
       "   'no_connections': 88,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 6}},\n",
       " 'asia': {'A': {'direct_edges': 8,\n",
       "   'reversed_edges': 0,\n",
       "   'indirect_paths': 9,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 1,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'B': {'direct_edges': 0,\n",
       "   'reversed_edges': 7,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 5,\n",
       "   'no_connections': 2,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 0,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 12,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 3}},\n",
       " 'insurance': {'A': {'direct_edges': 48,\n",
       "   'reversed_edges': 6,\n",
       "   'indirect_paths': 38,\n",
       "   'reversed_indirect_paths': 7,\n",
       "   'no_connections': 18,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 5},\n",
       "  'B': {'direct_edges': 1,\n",
       "   'reversed_edges': 24,\n",
       "   'indirect_paths': 1,\n",
       "   'reversed_indirect_paths': 4,\n",
       "   'no_connections': 11,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 2},\n",
       "  'C': {'direct_edges': 1,\n",
       "   'reversed_edges': 2,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 4,\n",
       "   'no_connections': 33,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 5}},\n",
       " 'mildew': {'A': {'direct_edges': 45,\n",
       "   'reversed_edges': 4,\n",
       "   'indirect_paths': 36,\n",
       "   'reversed_indirect_paths': 3,\n",
       "   'no_connections': 11,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 6},\n",
       "  'B': {'direct_edges': 1,\n",
       "   'reversed_edges': 34,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 10,\n",
       "   'no_connections': 24,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 7},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 1,\n",
       "   'indirect_paths': 42,\n",
       "   'reversed_indirect_paths': 48,\n",
       "   'no_connections': 42,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 22}},\n",
       " 'child': {'A': {'direct_edges': 25,\n",
       "   'reversed_edges': 1,\n",
       "   'indirect_paths': 14,\n",
       "   'reversed_indirect_paths': 2,\n",
       "   'no_connections': 12,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 2},\n",
       "  'B': {'direct_edges': 0,\n",
       "   'reversed_edges': 15,\n",
       "   'indirect_paths': 8,\n",
       "   'reversed_indirect_paths': 4,\n",
       "   'no_connections': 6,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 2,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 2,\n",
       "   'no_connections': 15,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0}},\n",
       " 'cancer': {'A': {'direct_edges': 4,\n",
       "   'reversed_edges': 1,\n",
       "   'indirect_paths': 4,\n",
       "   'reversed_indirect_paths': 1,\n",
       "   'no_connections': 1,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'B': {'direct_edges': 0,\n",
       "   'reversed_edges': 3,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 2,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 1},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 0,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 0,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0}},\n",
       " 'water': {'A': {'direct_edges': 53,\n",
       "   'reversed_edges': 15,\n",
       "   'indirect_paths': 12,\n",
       "   'reversed_indirect_paths': 1,\n",
       "   'no_connections': 32,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'B': {'direct_edges': 1,\n",
       "   'reversed_edges': 18,\n",
       "   'indirect_paths': 10,\n",
       "   'reversed_indirect_paths': 1,\n",
       "   'no_connections': 5,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0},\n",
       "  'C': {'direct_edges': 0,\n",
       "   'reversed_edges': 4,\n",
       "   'indirect_paths': 27,\n",
       "   'reversed_indirect_paths': 17,\n",
       "   'no_connections': 42,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 17}},\n",
       " 'barley': {'A': {'direct_edges': 44,\n",
       "   'reversed_edges': 25,\n",
       "   'indirect_paths': 47,\n",
       "   'reversed_indirect_paths': 24,\n",
       "   'no_connections': 62,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 22},\n",
       "  'B': {'direct_edges': 2,\n",
       "   'reversed_edges': 18,\n",
       "   'indirect_paths': 7,\n",
       "   'reversed_indirect_paths': 36,\n",
       "   'no_connections': 21,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 7},\n",
       "  'C': {'direct_edges': 1,\n",
       "   'reversed_edges': 0,\n",
       "   'indirect_paths': 0,\n",
       "   'reversed_indirect_paths': 0,\n",
       "   'no_connections': 0,\n",
       "   'common_parents': 0,\n",
       "   'common_childs': 0}}}"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# calculate the number of lists in answer_type_dict\n",
    "answer_type_num = {d:{k:{\"direct_edges\":0,\"reversed_edges\":0,\"indirect_paths\":0,\"reversed_indirect_paths\":0,\"no_connections\":0, \"common_parents\":0, \"common_childs\":0} for k in [\"A\",\"B\",\"C\"]} for d in datasets}\n",
    "for d in datasets:\n",
    "    for k in answer_type_dict[d]:\n",
    "        for kk in answer_type_dict[d][k]:\n",
    "            answer_type_num[d][k][kk] = len(answer_type_dict[d][k][kk])\n",
    "answer_type_num"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'alarm': {'A': {'direct_edges': 0.3333333333333333,\n",
       "   'reversed_edges': 0.015151515151515152,\n",
       "   'indirect_paths': 0.2803030303030303,\n",
       "   'reversed_indirect_paths': 0.0,\n",
       "   'no_connections': 0.3712121212121212,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.05303030303030303},\n",
       "  'B': {'direct_edges': 0.01639344262295082,\n",
       "   'reversed_edges': 0.36065573770491804,\n",
       "   'indirect_paths': 0.09836065573770492,\n",
       "   'reversed_indirect_paths': 0.18032786885245902,\n",
       "   'no_connections': 0.3442622950819672,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.04918032786885246},\n",
       "  'C': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.0,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.03296703296703297,\n",
       "   'no_connections': 0.967032967032967,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.06593406593406594}},\n",
       " 'asia': {'A': {'direct_edges': 0.4444444444444444,\n",
       "   'reversed_edges': 0.0,\n",
       "   'indirect_paths': 0.5,\n",
       "   'reversed_indirect_paths': 0.0,\n",
       "   'no_connections': 0.05555555555555555,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'B': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.5,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.35714285714285715,\n",
       "   'no_connections': 0.14285714285714285,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'C': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.0,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.0,\n",
       "   'no_connections': 1.0,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.25}},\n",
       " 'insurance': {'A': {'direct_edges': 0.41025641025641024,\n",
       "   'reversed_edges': 0.05128205128205128,\n",
       "   'indirect_paths': 0.3247863247863248,\n",
       "   'reversed_indirect_paths': 0.05982905982905983,\n",
       "   'no_connections': 0.15384615384615385,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.042735042735042736},\n",
       "  'B': {'direct_edges': 0.024390243902439025,\n",
       "   'reversed_edges': 0.5853658536585366,\n",
       "   'indirect_paths': 0.024390243902439025,\n",
       "   'reversed_indirect_paths': 0.0975609756097561,\n",
       "   'no_connections': 0.2682926829268293,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.04878048780487805},\n",
       "  'C': {'direct_edges': 0.025,\n",
       "   'reversed_edges': 0.05,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.1,\n",
       "   'no_connections': 0.825,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.125}},\n",
       " 'mildew': {'A': {'direct_edges': 0.45454545454545453,\n",
       "   'reversed_edges': 0.04040404040404041,\n",
       "   'indirect_paths': 0.36363636363636365,\n",
       "   'reversed_indirect_paths': 0.030303030303030304,\n",
       "   'no_connections': 0.1111111111111111,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.06060606060606061},\n",
       "  'B': {'direct_edges': 0.014492753623188406,\n",
       "   'reversed_edges': 0.4927536231884058,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.14492753623188406,\n",
       "   'no_connections': 0.34782608695652173,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.10144927536231885},\n",
       "  'C': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.007518796992481203,\n",
       "   'indirect_paths': 0.3157894736842105,\n",
       "   'reversed_indirect_paths': 0.3609022556390977,\n",
       "   'no_connections': 0.3157894736842105,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.16541353383458646}},\n",
       " 'child': {'A': {'direct_edges': 0.46296296296296297,\n",
       "   'reversed_edges': 0.018518518518518517,\n",
       "   'indirect_paths': 0.25925925925925924,\n",
       "   'reversed_indirect_paths': 0.037037037037037035,\n",
       "   'no_connections': 0.2222222222222222,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.037037037037037035},\n",
       "  'B': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.45454545454545453,\n",
       "   'indirect_paths': 0.24242424242424243,\n",
       "   'reversed_indirect_paths': 0.12121212121212122,\n",
       "   'no_connections': 0.18181818181818182,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'C': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.10526315789473684,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.10526315789473684,\n",
       "   'no_connections': 0.7894736842105263,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0}},\n",
       " 'cancer': {'A': {'direct_edges': 0.36363636363636365,\n",
       "   'reversed_edges': 0.09090909090909091,\n",
       "   'indirect_paths': 0.36363636363636365,\n",
       "   'reversed_indirect_paths': 0.09090909090909091,\n",
       "   'no_connections': 0.09090909090909091,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'B': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.6,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.0,\n",
       "   'no_connections': 0.4,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.2},\n",
       "  'C': {'direct_edges': inf,\n",
       "   'reversed_edges': inf,\n",
       "   'indirect_paths': inf,\n",
       "   'reversed_indirect_paths': inf,\n",
       "   'no_connections': inf,\n",
       "   'common_parents': inf,\n",
       "   'common_childs': inf}},\n",
       " 'water': {'A': {'direct_edges': 0.4690265486725664,\n",
       "   'reversed_edges': 0.13274336283185842,\n",
       "   'indirect_paths': 0.10619469026548672,\n",
       "   'reversed_indirect_paths': 0.008849557522123894,\n",
       "   'no_connections': 0.2831858407079646,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'B': {'direct_edges': 0.02857142857142857,\n",
       "   'reversed_edges': 0.5142857142857142,\n",
       "   'indirect_paths': 0.2857142857142857,\n",
       "   'reversed_indirect_paths': 0.02857142857142857,\n",
       "   'no_connections': 0.14285714285714285,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0},\n",
       "  'C': {'direct_edges': 0.0,\n",
       "   'reversed_edges': 0.044444444444444446,\n",
       "   'indirect_paths': 0.3,\n",
       "   'reversed_indirect_paths': 0.18888888888888888,\n",
       "   'no_connections': 0.4666666666666667,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.18888888888888888}},\n",
       " 'barley': {'A': {'direct_edges': 0.21782178217821782,\n",
       "   'reversed_edges': 0.12376237623762376,\n",
       "   'indirect_paths': 0.23267326732673269,\n",
       "   'reversed_indirect_paths': 0.1188118811881188,\n",
       "   'no_connections': 0.3069306930693069,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.10891089108910891},\n",
       "  'B': {'direct_edges': 0.023809523809523808,\n",
       "   'reversed_edges': 0.21428571428571427,\n",
       "   'indirect_paths': 0.08333333333333333,\n",
       "   'reversed_indirect_paths': 0.42857142857142855,\n",
       "   'no_connections': 0.25,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.08333333333333333},\n",
       "  'C': {'direct_edges': 1.0,\n",
       "   'reversed_edges': 0.0,\n",
       "   'indirect_paths': 0.0,\n",
       "   'reversed_indirect_paths': 0.0,\n",
       "   'no_connections': 0.0,\n",
       "   'common_parents': 0.0,\n",
       "   'common_childs': 0.0}}}"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# calculate the ratio of each type of real structures of each anwer for each dataset\n",
    "# the total number is direct_edges + reversed_edges + indirect_paths + reversed_indirect_paths + no_connections\n",
    "# if total number is 0, then the ratio is inf\n",
    "answer_type_ratio = {d:{k:{\"direct_edges\":0,\"reversed_edges\":0,\"indirect_paths\":0,\"reversed_indirect_paths\":0,\"no_connections\":0, \"common_parents\":0, \"common_childs\":0} for k in [\"A\",\"B\",\"C\"]} for d in datasets}\n",
    "for d in datasets:\n",
    "    for k in answer_type_dict[d]:\n",
    "        valid_keys = [\"direct_edges\",\"reversed_edges\",\"indirect_paths\",\"reversed_indirect_paths\",\"no_connections\"]\n",
    "        total_num = 0\n",
    "        for key in valid_keys:\n",
    "            total_num += answer_type_num[d][k][key]\n",
    "        if total_num == 0:\n",
    "            answer_type_ratio[d][k] = {\"direct_edges\":np.inf,\"reversed_edges\":np.inf,\"indirect_paths\":np.inf,\"reversed_indirect_paths\":np.inf,\"no_connections\":np.inf, \"common_parents\":np.inf, \"common_childs\":np.inf}\n",
    "            continue\n",
    "        for kk in answer_type_dict[d][k]:\n",
    "            answer_type_ratio[d][k][kk] = answer_type_num[d][k][kk] / total_num\n",
    "answer_type_ratio"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "# #print answer_type_ratio in a table, \n",
    "# answer_type_ratio_df = pd.DataFrame(answer_type_ratio)\n",
    "# answer_type_ratio_df\n",
    "# take the ratio of different structures as a column in a dataframe\n",
    "answer_type_ratio_df = pd.DataFrame(answer_type_ratio)\n",
    "answer_type_ratio_df = answer_type_ratio_df.stack().reset_index()\n",
    "# the colum 0 is a dict of the ratio of different structures, we need to expand it to different columns\n",
    "answer_type_ratio_df = pd.concat([answer_type_ratio_df.drop([0], axis=1), answer_type_ratio_df[0].apply(pd.Series)], axis=1)\n",
    "#save the dataframe to a csv file\n",
    "answer_type_ratio_df.to_csv(\"out/answer_type_ratio.csv\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'A': {'direct_edges': 271,\n",
       "  'reversed_edges': 54,\n",
       "  'indirect_paths': 197,\n",
       "  'reversed_indirect_paths': 38,\n",
       "  'no_connections': 186,\n",
       "  'common_parents': 42,\n",
       "  'common_childs': 42},\n",
       " 'B': {'direct_edges': 6,\n",
       "  'reversed_edges': 141,\n",
       "  'indirect_paths': 32,\n",
       "  'reversed_indirect_paths': 71,\n",
       "  'no_connections': 92,\n",
       "  'common_parents': 20,\n",
       "  'common_childs': 20},\n",
       " 'C': {'direct_edges': 2,\n",
       "  'reversed_edges': 9,\n",
       "  'indirect_paths': 69,\n",
       "  'reversed_indirect_paths': 74,\n",
       "  'no_connections': 232,\n",
       "  'common_parents': 53,\n",
       "  'common_childs': 53}}"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# calculate the sum of the number of direct_edges, etc of all datasets grouped by answers in answer_type_dict\n",
    "answer_type_sum = {k:{\"direct_edges\":0,\"reversed_edges\":0,\"indirect_paths\":0,\"reversed_indirect_paths\":0,\"no_connections\":0, \"common_parents\":0, \"common_childs\":0} for k in [\"A\",\"B\",\"C\"]}\n",
    "for d in datasets:\n",
    "    for k in answer_type_dict[d]:\n",
    "        for kk in answer_type_dict[d][k]:\n",
    "            answer_type_sum[k][kk] += len(answer_type_dict[d][k][kk])\n",
    "answer_type_sum"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "LLMCSL",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.17"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
