{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.append(\"../\")\n",
    "sys.path.append(\"../../\")\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "from pythautomata.utilities import pdfa_generator\n",
    "from pythautomata.utilities import nicaud_dfa_generator\n",
    "from src import utils, constants\n",
    "from pythautomata.model_exporters.dot_exporters.wfa_dot_exporting_strategy import WFADotExportingStrategy\n",
    "from IPython.display import display\n",
    "from src.hypothesis_aware_sample_probabilistic_teacher import HypothesisAwareSampleProbabilisticTeacher\n",
    "from src.syncronic_model_guided_language_model import SyncronicModelGuidedLanguageModel\n",
    "from pymodelextractor.teachers.sample_probabilistic_teacher import SampleProbabilisticTeacher\n",
    "from pythautomata.utilities.probability_partitioner import QuantizationProbabilityPartitioner\n",
    "from pythautomata.model_comparators.wfa_partition_comparison_strategy import WFAPartitionComparator\n",
    "from pythautomata.utilities.guiding_wfa_sequence_generator import GuidingWDFASequenceGenerator\n",
    "from pymodelextractor.learners.observation_tree_learners.pdfa_quantization_n_ary_tree_learner import PDFAQuantizationNAryTreeLearner"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Create a random PDFA with zero-transitions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/svg+xml": [
       "<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
       "<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
       " \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
       "<!-- Generated by graphviz version 2.47.1 (20210417.1919)\n",
       " -->\n",
       "<!-- Title: weighted_automaton Pages: 1 -->\n",
       "<svg width=\"427pt\" height=\"150pt\"\n",
       " viewBox=\"0.00 0.00 426.74 150.37\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
       "<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 146.37)\">\n",
       "<title>weighted_automaton</title>\n",
       "<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-146.37 422.74,-146.37 422.74,4 -4,4\"/>\n",
       "<!-- 0 -->\n",
       "<g id=\"node1\" class=\"node\">\n",
       "<title>0</title>\n",
       "<polygon fill=\"none\" stroke=\"black\" points=\"61,-97.13 0,-59.13 61,-21.13 122,-59.13 61,-97.13\"/>\n",
       "<text text-anchor=\"middle\" x=\"61\" y=\"-62.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0</text>\n",
       "<text text-anchor=\"middle\" x=\"61\" y=\"-47.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.69132</text>\n",
       "</g>\n",
       "<!-- 1 -->\n",
       "<g id=\"node2\" class=\"node\">\n",
       "<title>1</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"220.23\" cy=\"-109.13\" rx=\"33.47\" ry=\"33.47\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-112.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1</text>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-97.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.523</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;1 -->\n",
       "<g id=\"edge1\" class=\"edge\">\n",
       "<title>0&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M96.42,-75.35C109.81,-81.22 125.42,-87.53 140,-92.13 151.95,-95.91 165.17,-99.11 177.34,-101.69\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"176.76,-105.14 187.26,-103.7 178.16,-98.28 176.76,-105.14\"/>\n",
       "<text text-anchor=\"middle\" x=\"154.5\" y=\"-102.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 5 -->\n",
       "<g id=\"node3\" class=\"node\">\n",
       "<title>5</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"375.6\" cy=\"-43.13\" rx=\"43.27\" ry=\"43.27\"/>\n",
       "<text text-anchor=\"middle\" x=\"375.6\" y=\"-46.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">5</text>\n",
       "<text text-anchor=\"middle\" x=\"375.6\" y=\"-31.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.11519</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;5 -->\n",
       "<g id=\"edge2\" class=\"edge\">\n",
       "<title>0&#45;&gt;5</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M117.07,-55.95C138.85,-54.72 164.1,-53.32 187,-52.13 232.69,-49.76 284.65,-47.28 322.28,-45.53\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"322.67,-49.02 332.5,-45.06 322.35,-42.02 322.67,-49.02\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-55.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.30868</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;0 -->\n",
       "<g id=\"edge3\" class=\"edge\">\n",
       "<title>1&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M194.59,-87.83C186.86,-82.18 177.98,-76.68 169,-73.13 156.43,-68.17 142.45,-64.9 128.86,-62.75\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"128.95,-59.23 118.56,-61.32 127.99,-66.16 128.95,-59.23\"/>\n",
       "<text text-anchor=\"middle\" x=\"154.5\" y=\"-76.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;5 -->\n",
       "<g id=\"edge4\" class=\"edge\">\n",
       "<title>1&#45;&gt;5</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M251.17,-96.25C272.58,-87.04 301.86,-74.44 326.52,-63.82\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"327.92,-67.03 335.72,-59.86 325.15,-60.6 327.92,-67.03\"/>\n",
       "<text text-anchor=\"middle\" x=\"292.97\" y=\"-88.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.477</text>\n",
       "</g>\n",
       "<!-- 5&#45;&gt;0 -->\n",
       "<g id=\"edge5\" class=\"edge\">\n",
       "<title>5&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M334.64,-29.38C296.61,-18.08 237.81,-5.27 187,-14.13 159.14,-19 129.3,-29.52 105.76,-39.17\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"104.27,-36 96.41,-43.09 106.98,-42.45 104.27,-36\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-32.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-17.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.88481</text>\n",
       "</g>\n",
       "</g>\n",
       "</svg>\n"
      ],
      "text/plain": [
       "<graphviz.graphs.Digraph at 0x2c876015790>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "size = 5\n",
    "dfa = nicaud_dfa_generator.generate_dfa(alphabet = constants.binaryAlphabet, nominal_size= size, seed = 42)\n",
    "dfa.name = \"random_PDFA_nominal_size_\"+str(size)   \n",
    "pdfa = pdfa_generator.pdfa_from_dfa(dfa, zero_probability=0.3)  \n",
    "\n",
    "\n",
    "exporter = WFADotExportingStrategy()\n",
    "graph = exporter.create_graph(pdfa)\n",
    "\n",
    "display(graph)    "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Extractions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "max_seq_length = 10\n",
    "partitions = 1000   \n",
    "partitioner = QuantizationProbabilityPartitioner(partitions)\n",
    "partition_comparator = WFAPartitionComparator(partitioner)\n",
    "teacher1 = HypothesisAwareSampleProbabilisticTeacher(model = pdfa, comparator = partition_comparator, sample_size = 1000, max_seq_length = max_seq_length)\n",
    "learner1 = PDFAQuantizationNAryTreeLearner(omit_zero_transitions = True, probabilityPartitioner = partitioner, check_probabilistic_hipothesis = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/svg+xml": [
       "<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
       "<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
       " \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
       "<!-- Generated by graphviz version 2.47.1 (20210417.1919)\n",
       " -->\n",
       "<!-- Title: weighted_automaton Pages: 1 -->\n",
       "<svg width=\"438pt\" height=\"138pt\"\n",
       " viewBox=\"0.00 0.00 438.22 138.48\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
       "<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 134.48)\">\n",
       "<title>weighted_automaton</title>\n",
       "<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-134.48 434.22,-134.48 434.22,4 -4,4\"/>\n",
       "<!-- 0 -->\n",
       "<g id=\"node1\" class=\"node\">\n",
       "<title>0</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"43.13\" cy=\"-54.48\" rx=\"43.27\" ry=\"43.27\"/>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-58.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0</text>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-43.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.11519</text>\n",
       "</g>\n",
       "<!-- ϵ -->\n",
       "<g id=\"node2\" class=\"node\">\n",
       "<title>ϵ</title>\n",
       "<polygon fill=\"none\" stroke=\"black\" points=\"239.27,-130.48 178.27,-92.48 239.27,-54.48 300.27,-92.48 239.27,-130.48\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-96.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">ϵ</text>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-81.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.69132</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;ϵ -->\n",
       "<g id=\"edge1\" class=\"edge\">\n",
       "<title>0&#45;&gt;ϵ</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M84.76,-65.86C91.26,-67.52 97.93,-69.12 104.27,-70.48 128.56,-75.69 155.57,-80.34 178.93,-84.01\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"178.63,-87.5 189.05,-85.57 179.7,-80.58 178.63,-87.5\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-84.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.88481</text>\n",
       "</g>\n",
       "<!-- HOLE -->\n",
       "<g id=\"node3\" class=\"node\">\n",
       "<title>HOLE</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"392.74\" cy=\"-37.48\" rx=\"37.45\" ry=\"37.45\"/>\n",
       "<text text-anchor=\"middle\" x=\"392.74\" y=\"-41.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">HOLE</text>\n",
       "<text text-anchor=\"middle\" x=\"392.74\" y=\"-26.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;HOLE -->\n",
       "<g id=\"edge2\" class=\"edge\">\n",
       "<title>0&#45;&gt;HOLE</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M85.5,-46.02C91.78,-44.79 98.19,-43.58 104.27,-42.48 137.05,-36.55 145.06,-33.15 178.27,-30.48 232.31,-26.12 246.08,-28.41 300.27,-30.48 314.87,-31.03 330.75,-32.09 345.12,-33.22\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"345.03,-36.72 355.28,-34.04 345.6,-29.74 345.03,-36.72\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-34.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;0 -->\n",
       "<g id=\"edge4\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M209.26,-72.92C195.13,-64.55 177.5,-55.73 160.27,-51.48 139.58,-46.37 116.19,-45.99 95.85,-47.3\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"95.52,-43.82 85.83,-48.1 96.07,-50.8 95.52,-43.82\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-55.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.30868</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;HOLE -->\n",
       "<g id=\"edge5\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;HOLE</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M278.49,-78.6C299.56,-70.95 325.82,-61.41 347.74,-53.45\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"348.95,-56.74 357.16,-50.03 346.56,-50.16 348.95,-56.74\"/>\n",
       "<text text-anchor=\"middle\" x=\"327.77\" y=\"-66.28\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0</text>\n",
       "</g>\n",
       "<!-- HOLE&#45;&gt;HOLE -->\n",
       "<g id=\"edge3\" class=\"edge\">\n",
       "<title>HOLE&#45;&gt;HOLE</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M380.76,-73.23C381,-84.28 384.99,-92.95 392.74,-92.95 397.83,-92.95 401.3,-89.22 403.15,-83.52\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"406.67,-83.64 404.73,-73.23 399.76,-82.58 406.67,-83.64\"/>\n",
       "<text text-anchor=\"middle\" x=\"392.74\" y=\"-111.75\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0</text>\n",
       "<text text-anchor=\"middle\" x=\"392.74\" y=\"-96.75\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0</text>\n",
       "</g>\n",
       "</g>\n",
       "</svg>\n"
      ],
      "text/plain": [
       "<graphviz.graphs.Digraph at 0x2c806ba45b0>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "result = learner1.learn(teacher1)\n",
    "graph = exporter.create_graph(result.model)\n",
    "display(graph) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "undefined_ouput = np.zeros(len(pdfa.alphabet)+1)\n",
    "synchronic_model = SyncronicModelGuidedLanguageModel(pdfa, guiding_model=None, model_name= pdfa.name+\"_SYNCH\", max_seq_length=10, \n",
    "                                                        normalize_outputs=False, top_k=len(pdfa.alphabet)+1, check_is_defined=True, \n",
    "                                                        undefined_ouput=undefined_ouput)\n",
    "teacher2 =  SampleProbabilisticTeacher(synchronic_model, comparator = partition_comparator, sample_size = 100, max_seq_length = 25)\n",
    "learner2 = PDFAQuantizationNAryTreeLearner(omit_zero_transitions = False, probabilityPartitioner = partitioner, check_probabilistic_hipothesis = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/svg+xml": [
       "<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
       "<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
       " \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
       "<!-- Generated by graphviz version 2.47.1 (20210417.1919)\n",
       " -->\n",
       "<!-- Title: weighted_automaton Pages: 1 -->\n",
       "<svg width=\"427pt\" height=\"128pt\"\n",
       " viewBox=\"0.00 0.00 427.01 127.87\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
       "<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 123.87)\">\n",
       "<title>weighted_automaton</title>\n",
       "<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-123.87 423.01,-123.87 423.01,4 -4,4\"/>\n",
       "<!-- 0 -->\n",
       "<g id=\"node1\" class=\"node\">\n",
       "<title>0</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"43.13\" cy=\"-43.87\" rx=\"43.27\" ry=\"43.27\"/>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-47.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0</text>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-32.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.11519</text>\n",
       "</g>\n",
       "<!-- ϵ -->\n",
       "<g id=\"node2\" class=\"node\">\n",
       "<title>ϵ</title>\n",
       "<polygon fill=\"none\" stroke=\"black\" points=\"239.27,-119.87 178.27,-81.87 239.27,-43.87 300.27,-81.87 239.27,-119.87\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-85.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">ϵ</text>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-70.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.69132</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;ϵ -->\n",
       "<g id=\"edge1\" class=\"edge\">\n",
       "<title>0&#45;&gt;ϵ</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M84.76,-55.25C91.26,-56.91 97.93,-58.51 104.27,-59.87 128.56,-65.08 155.57,-69.73 178.93,-73.4\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"178.63,-76.89 189.05,-74.96 179.7,-69.98 178.63,-76.89\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-73.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.88481</text>\n",
       "</g>\n",
       "<!-- 1 -->\n",
       "<g id=\"node3\" class=\"node\">\n",
       "<title>1</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"392.14\" cy=\"-26.87\" rx=\"26.74\" ry=\"26.74\"/>\n",
       "<text text-anchor=\"middle\" x=\"392.14\" y=\"-30.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1</text>\n",
       "<text text-anchor=\"middle\" x=\"392.14\" y=\"-15.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.0</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;1 -->\n",
       "<g id=\"edge2\" class=\"edge\">\n",
       "<title>0&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M85.5,-35.41C91.78,-34.19 98.19,-32.97 104.27,-31.87 137.05,-25.94 145.06,-22.55 178.27,-19.87 232.31,-15.52 246.08,-17.79 300.27,-19.87 318.3,-20.56 338.29,-22.03 354.93,-23.44\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"355.05,-26.96 365.32,-24.35 355.66,-19.99 355.05,-26.96\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-23.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;0 -->\n",
       "<g id=\"edge4\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M209.26,-62.31C195.13,-53.94 177.5,-45.12 160.27,-40.87 139.58,-35.76 116.19,-35.38 95.85,-36.7\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"95.52,-33.21 85.83,-37.49 96.07,-40.19 95.52,-33.21\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-44.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.30868</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;1 -->\n",
       "<g id=\"edge5\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M278.34,-67.99C302.47,-59.19 333.44,-47.9 356.82,-39.38\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"358.13,-42.63 366.33,-35.91 355.74,-36.05 358.13,-42.63\"/>\n",
       "<text text-anchor=\"middle\" x=\"332.77\" y=\"-55.67\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;1 -->\n",
       "<g id=\"edge3\" class=\"edge\">\n",
       "<title>1&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M381.39,-51.79C380.51,-62.54 384.09,-71.74 392.14,-71.74 397.42,-71.74 400.77,-67.78 402.21,-62.01\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"405.72,-62 402.88,-51.79 398.73,-61.53 405.72,-62\"/>\n",
       "<text text-anchor=\"middle\" x=\"392.14\" y=\"-90.54\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.0</text>\n",
       "<text text-anchor=\"middle\" x=\"392.14\" y=\"-75.54\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "</g>\n",
       "</svg>\n"
      ],
      "text/plain": [
       "<graphviz.graphs.Digraph at 0x2c806ba4580>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "result2 = learner2.learn(teacher2)\n",
    "graph = exporter.create_graph(result2.model)\n",
    "display(graph) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/svg+xml": [
       "<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
       "<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
       " \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
       "<!-- Generated by graphviz version 2.47.1 (20210417.1919)\n",
       " -->\n",
       "<!-- Title: weighted_automaton Pages: 1 -->\n",
       "<svg width=\"440pt\" height=\"127pt\"\n",
       " viewBox=\"0.00 0.00 439.74 127.13\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
       "<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 123.13)\">\n",
       "<title>weighted_automaton</title>\n",
       "<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-123.13 435.74,-123.13 435.74,4 -4,4\"/>\n",
       "<!-- 0 -->\n",
       "<g id=\"node1\" class=\"node\">\n",
       "<title>0</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"43.13\" cy=\"-43.13\" rx=\"43.27\" ry=\"43.27\"/>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-46.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0</text>\n",
       "<text text-anchor=\"middle\" x=\"43.13\" y=\"-31.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.11519</text>\n",
       "</g>\n",
       "<!-- ϵ -->\n",
       "<g id=\"node2\" class=\"node\">\n",
       "<title>ϵ</title>\n",
       "<polygon fill=\"none\" stroke=\"black\" points=\"239.27,-119.13 178.27,-81.13 239.27,-43.13 300.27,-81.13 239.27,-119.13\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-84.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">ϵ</text>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-69.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.69132</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;ϵ -->\n",
       "<g id=\"edge1\" class=\"edge\">\n",
       "<title>0&#45;&gt;ϵ</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M84.76,-54.52C91.26,-56.17 97.93,-57.77 104.27,-59.13 128.56,-64.35 155.57,-69 178.93,-72.66\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"178.63,-76.16 189.05,-74.23 179.7,-69.24 178.63,-76.16\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-87.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.88481</text>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-72.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;0 -->\n",
       "<g id=\"edge4\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M209.26,-61.57C195.13,-53.2 177.5,-44.39 160.27,-40.13 139.58,-35.03 116.19,-34.65 95.85,-35.96\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"95.52,-32.48 85.83,-36.76 96.07,-39.45 95.52,-32.48\"/>\n",
       "<text text-anchor=\"middle\" x=\"132.27\" y=\"-43.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.30868</text>\n",
       "</g>\n",
       "<!-- 1 -->\n",
       "<g id=\"node3\" class=\"node\">\n",
       "<title>1</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"398.5\" cy=\"-43.13\" rx=\"33.47\" ry=\"33.47\"/>\n",
       "<text text-anchor=\"middle\" x=\"398.5\" y=\"-46.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1</text>\n",
       "<text text-anchor=\"middle\" x=\"398.5\" y=\"-31.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.523</text>\n",
       "</g>\n",
       "<!-- ϵ&#45;&gt;1 -->\n",
       "<g id=\"edge5\" class=\"edge\">\n",
       "<title>ϵ&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M286.86,-72.66C305.72,-68.95 327.63,-64.26 347.27,-59.13 350.46,-58.3 353.74,-57.39 357.03,-56.43\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"358.27,-59.71 366.83,-53.47 356.25,-53.01 358.27,-59.71\"/>\n",
       "<text text-anchor=\"middle\" x=\"332.77\" y=\"-68.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;0 -->\n",
       "<g id=\"edge2\" class=\"edge\">\n",
       "<title>1&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M366.33,-33.4C347.43,-28.01 322.71,-21.86 300.27,-19.13 213.63,-8.6 190.15,-15.61 104.27,-31.13 101.42,-31.65 98.5,-32.19 95.55,-32.74\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"94.66,-29.35 85.5,-34.67 95.98,-36.23 94.66,-29.35\"/>\n",
       "<text text-anchor=\"middle\" x=\"239.27\" y=\"-22.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.477</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;ϵ -->\n",
       "<g id=\"edge3\" class=\"edge\">\n",
       "<title>1&#45;&gt;ϵ</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M365.13,-40.44C350.62,-40.02 333.41,-40.62 318.27,-44.13 305.36,-47.12 292.07,-52.46 280.2,-58.16\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"278.38,-55.16 271.02,-62.78 281.53,-61.42 278.38,-55.16\"/>\n",
       "<text text-anchor=\"middle\" x=\"332.77\" y=\"-47.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "</g>\n",
       "</svg>\n"
      ],
      "text/plain": [
       "<graphviz.graphs.Digraph at 0x2c806bf5040>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "teacher3 =  SampleProbabilisticTeacher(pdfa, comparator = partition_comparator, sample_size = 100, max_seq_length = 25)\n",
    "learner3 = PDFAQuantizationNAryTreeLearner(omit_zero_transitions = False, probabilityPartitioner = partitioner, check_probabilistic_hipothesis = False)\n",
    "result3 = learner3.learn(teacher3)\n",
    "graph = exporter.create_graph(result3.model)\n",
    "display(graph) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/svg+xml": [
       "<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
       "<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
       " \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
       "<!-- Generated by graphviz version 2.47.1 (20210417.1919)\n",
       " -->\n",
       "<!-- Title: weighted_automaton Pages: 1 -->\n",
       "<svg width=\"427pt\" height=\"150pt\"\n",
       " viewBox=\"0.00 0.00 426.74 150.37\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
       "<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 146.37)\">\n",
       "<title>weighted_automaton</title>\n",
       "<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-146.37 422.74,-146.37 422.74,4 -4,4\"/>\n",
       "<!-- 0 -->\n",
       "<g id=\"node1\" class=\"node\">\n",
       "<title>0</title>\n",
       "<polygon fill=\"none\" stroke=\"black\" points=\"61,-97.13 0,-59.13 61,-21.13 122,-59.13 61,-97.13\"/>\n",
       "<text text-anchor=\"middle\" x=\"61\" y=\"-62.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0</text>\n",
       "<text text-anchor=\"middle\" x=\"61\" y=\"-47.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.69132</text>\n",
       "</g>\n",
       "<!-- 1 -->\n",
       "<g id=\"node2\" class=\"node\">\n",
       "<title>1</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"220.23\" cy=\"-109.13\" rx=\"33.47\" ry=\"33.47\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-112.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1</text>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-97.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.523</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;1 -->\n",
       "<g id=\"edge1\" class=\"edge\">\n",
       "<title>0&#45;&gt;1</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M96.42,-75.35C109.81,-81.22 125.42,-87.53 140,-92.13 151.95,-95.91 165.17,-99.11 177.34,-101.69\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"176.76,-105.14 187.26,-103.7 178.16,-98.28 176.76,-105.14\"/>\n",
       "<text text-anchor=\"middle\" x=\"154.5\" y=\"-102.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 5 -->\n",
       "<g id=\"node3\" class=\"node\">\n",
       "<title>5</title>\n",
       "<ellipse fill=\"none\" stroke=\"black\" cx=\"375.6\" cy=\"-43.13\" rx=\"43.27\" ry=\"43.27\"/>\n",
       "<text text-anchor=\"middle\" x=\"375.6\" y=\"-46.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">5</text>\n",
       "<text text-anchor=\"middle\" x=\"375.6\" y=\"-31.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0.11519</text>\n",
       "</g>\n",
       "<!-- 0&#45;&gt;5 -->\n",
       "<g id=\"edge2\" class=\"edge\">\n",
       "<title>0&#45;&gt;5</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M117.07,-55.95C138.85,-54.72 164.1,-53.32 187,-52.13 232.69,-49.76 284.65,-47.28 322.28,-45.53\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"322.67,-49.02 332.5,-45.06 322.35,-42.02 322.67,-49.02\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-55.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.30868</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;0 -->\n",
       "<g id=\"edge3\" class=\"edge\">\n",
       "<title>1&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M194.59,-87.83C186.86,-82.18 177.98,-76.68 169,-73.13 156.43,-68.17 142.45,-64.9 128.86,-62.75\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"128.95,-59.23 118.56,-61.32 127.99,-66.16 128.95,-59.23\"/>\n",
       "<text text-anchor=\"middle\" x=\"154.5\" y=\"-76.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "</g>\n",
       "<!-- 1&#45;&gt;5 -->\n",
       "<g id=\"edge4\" class=\"edge\">\n",
       "<title>1&#45;&gt;5</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M251.17,-96.25C272.58,-87.04 301.86,-74.44 326.52,-63.82\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"327.92,-67.03 335.72,-59.86 325.15,-60.6 327.92,-67.03\"/>\n",
       "<text text-anchor=\"middle\" x=\"292.97\" y=\"-88.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.477</text>\n",
       "</g>\n",
       "<!-- 5&#45;&gt;0 -->\n",
       "<g id=\"edge5\" class=\"edge\">\n",
       "<title>5&#45;&gt;0</title>\n",
       "<path fill=\"none\" stroke=\"black\" d=\"M334.64,-29.38C296.61,-18.08 237.81,-5.27 187,-14.13 159.14,-19 129.3,-29.52 105.76,-39.17\"/>\n",
       "<polygon fill=\"black\" stroke=\"black\" points=\"104.27,-36 96.41,-43.09 106.98,-42.45 104.27,-36\"/>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-32.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">1&#45;0.0</text>\n",
       "<text text-anchor=\"middle\" x=\"220.23\" y=\"-17.93\" font-family=\"Times New Roman,serif\" font-size=\"14.00\">0&#45;0.88481</text>\n",
       "</g>\n",
       "</g>\n",
       "</svg>\n"
      ],
      "text/plain": [
       "<graphviz.graphs.Digraph at 0x2c806bf5ee0>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "graph = exporter.create_graph(pdfa)\n",
    "\n",
    "display(graph) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "sg2 = GuidingWDFASequenceGenerator(pdfa, max_seq_length, random_seed=42)\n",
    "sequences_in_target = sg2.generate_words(100)  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "False"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from pythautomata.base_types.sequence import Sequence\n",
    "from pythautomata.base_types.symbol import SymbolStr\n",
    "sequence = Sequence([SymbolStr('0'), SymbolStr('1')])\n",
    "synchronic_model.check_sequence_is_defined(sequence)"
   ]
  }
 ],
 "metadata": {
  "interpreter": {
   "hash": "ccd85e264f409eb34496ed1f618ace649acf293164c04c6c014b744b9959793c"
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.19"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
