import random
from nltk.grammar import Nonterminal
import numpy as np
from scipy.stats import skewnorm


grammar_dict = {
    "pcfg_example_regular": """
        S ->  [0.1]
        S -> 'a' S [0.45]
        S -> 'b' S [0.45]
    """,

    "pcfg_example_context_free": """
        S ->  [0.1]
        S -> 'a' S 'a' [0.45]
        S -> 'b' S 'b' [0.45]
    """,

    "pcfg_example_context_free_2": """
        S -> NOUN TENSE VERB [1]
        NOUN -> 'BlueBomber' [0.25] 
        NOUN ->  'Grijesh'  [0.25]
        NOUN ->  'I'  [0.25]
        NOUN ->  'We'  [0.25]
        TENSE ->  'am' [0.25]
        TENSE ->  'was' [0.25]
        TENSE ->  'is' [0.25]
        TENSE ->  'were' [0.25]
        VERB  ->  'going' [0.333]
        VERB  ->  'eating' [0.333]
        VERB  ->  'working' [0.333]
    """,

    "pcfg_example_context_sensitive": """
        S -> NOUN TENSE VERB [1]
        NOUN -> 'BlueBomber' [0.25] 
        NOUN ->  'Grijesh'  [0.25]
        NOUN ->  'I'  [0.25]
        NOUN ->  'We'  [0.25]
        
        'I' TENSE ->  'am' [1]

        'I' TENSE ->  'was' [0.333]
        'Grijesh' TENSE ->  'was' [0.333]
        'BlueBomber' TENSE ->  'was' [0.333]


        TENSE ->  'is' [0.25]
        TENSE ->  'were' [0.25]
        
        
        VERB  ->  'going' [0.333]
        VERB  ->  'eating' [0.333]
        VERB  ->  'working' [0.333]
    """,


    "ab_repeated": """
        S -> 'a' 'b' | 'a' 'b' S
    """,

    "abc_repeated": """
        S -> 'a' 'b' 'c' | 'a' 'b' 'c' S
    """,

    "anbn": """
        S -> 'a' 'b' | 'a' S 'b'
    """,

    "balanced_parenthesis_nested": """
        S -> '(' ')' | '(' S ')'
    """,

    "balanced_parenthesis": """
        S -> '('')'
        S -> '['']'
        S -> '{''}'
        S -> '(' S ')'
        S -> '[' S ']'
        S -> '{' S '}'
        S -> S S
    """,

    "pcfg_ab_repeated": """
        S -> 'a' 'b' [0.1] | 'a' 'b' S [0.9]
    """,

    
    "pcfg_balanced_parenthesis": """
        S -> S1 [1]
        S1 -> A1 [0.3]
        S1 -> A2 [0.3]
        S1 -> A3 [0.3]
        S1 -> S1 S1 [0.1]
        A1 -> '('')' [0.3]
        A1 -> '('S1')' [0.7]
        A2 -> '['']' [0.3]
        A2 -> '['S1']' [0.7]
        A3 -> '{''}' [0.3]
        A3 -> '{'S1'}' [0.7]
        """,

    "pcfg_reverse_string": """
        S -> A1 [1]
        A1 -> 'a' A1 'a' [0.475]
        A1 -> 'b' A1 'b' [0.475]
        A1 ->  [0.05]
    """,

    "pcfg_one_character_missing": """
        S -> B [0.1666]
        S -> C [0.1666]
        S -> A [0.1666]
        S -> C [0.1666]
        S -> A [0.1666]
        S -> B [0.1666]
        A -> 'b' A [0.495]
        A -> 'b' [0.005]
        A -> 'c' A [0.495]
        A -> 'c' [0.005]
        B -> 'a' B [0.495]
        B -> 'a' [0.005]
        B -> 'c' B [0.495]
        B -> 'c' [0.005]
        C -> 'a' C [0.495]
        C -> 'a' [0.005]
        C -> 'b' C [0.495]
        C -> 'b' [0.005]
    """,

    "example_1": """
        S -> NP VP
        S -> Aux NP VP
        S -> VP
        NP -> Det NOM
        NOM -> Noun
        NOM -> Noun NOM
        VP -> Verb
        VP -> Verb NP
        Det -> 'that ' | 'this ' | 'a ' | 'the '
        Noun -> 'book ' | 'flight ' | 'meal ' | 'man '
        Verb -> 'book ' | 'include ' | 'read '
        Aux -> 'does '
    """, 


    "pcfg_ab": """
        S -> 'a' 'b' [0.01]
        S -> 'a' 'b' S [0.99]
    """,

    "pcfg_ab_aabb": """
            S -> A [0.5]
            S -> B [0.5]
            A -> 'a' 'b' [0.01]
            A -> 'a' 'b' A [0.99]
            B -> 'a' 'a' 'b' 'b' [0.01]
            B -> 'a' 'a' 'b' 'b' B [0.99]
    """,

    "pcfg_ab_aabb_mixed": """
            S -> 'a' 'b' [0.01]
            S -> 'a' 'a' 'b' 'b' [0.01]
            S -> 'a' 'b' S [0.49]
            S -> 'a' 'a' 'b' 'b' S [0.49]
    """,

    "cfg3b": """
        A22 -> A21 A20 
        A22 -> A20 A19 
        A19 -> A16 A17 A18 
        A19 -> A17 A18 A16 
        A20 -> A17 A16 A18 
        A20 -> A16 A17 
        A21 -> A18 A16 
        A21 -> A16 A18 A17 
        A16 -> A15 A13 
        A16 -> A13 A15 A14 
        A17 -> A14 A13 A15 
        A17 -> A15 A13 A14 
        A18 -> A15 A14 A13 
        A18 -> A14 A13 
        A13 -> A11 A12 
        A13 -> A12 A11 
        A14 -> A11 A10 A12 
        A14 -> A10 A11 A12 
        A15 -> A12 A11 A10 
        A15 -> A11 A12 A10 
        A10 -> A7 A9 A8 
        A10 -> A9 A8 A7 
        A11 -> A8 A7 A9 
        A11 -> A7 A8 A9 
        A12 -> A8 A9 A7 
        A12 -> A9 A7 A8 
        A7 -> '3' '1' 
        A7 -> '1' '2' '3' 
        A8 -> '3' '2' 
        A8 -> '3' '1' '2' 
        A9 -> '3' '2' '1' 
        A9 -> '2' '1'
    """,

    "pcfg_cfg3b": """
        A22 -> A21 A20 [0.50]
        A22 -> A20 A19 [0.50]
        A19 -> A16 A17 A18 [0.50]
        A19 -> A17 A18 A16 [0.50]
        A20 -> A17 A16 A18 [0.50]
        A20 -> A16 A17 [0.50]
        A21 -> A18 A16 [0.50]
        A21 -> A16 A18 A17 [0.50]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A17 -> A14 A13 A15 [0.50]
        A17 -> A15 A13 A14 [0.50]
        A18 -> A15 A14 A13 [0.50]
        A18 -> A14 A13 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    "pcfg_cfg3b_disjoint_terminals_skewed_prob": """
        S -> A16 [1]
        A16 -> A15 A13 [0.90]
        A16 -> A13 A15 A14 [0.10]
        A13 -> A11 A12 [0.90]
        A13 -> A12 A11 [0.10]
        A14 -> A11 A10 A12 [0.90]
        A14 -> A10 A11 A12 [0.10]
        A15 -> A12 A11 A10 [0.90]
        A15 -> A11 A12 A10 [0.10]
        A10 -> A7 A9 A8 [0.90]
        A10 -> A9 A8 A7 [0.10]
        A11 -> A8 A7 A9 [0.90]
        A11 -> A7 A8 A9 [0.10]
        A12 -> A8 A9 A7 [0.90]
        A12 -> A9 A7 A8 [0.10]
        A7 -> '3' '1' [0.90]
        A7 -> '1' '2' '3' [0.10]
        A8 -> '6' '5' [0.90]
        A8 -> '6' '4' '5' [0.10]
        A9 -> '9' '8' '7' [0.90]
        A9 -> '8' '7' [0.10]
    """,


    "pcfg_cfg3b_disjoint_terminals": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.55": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.55]
        A7 -> '1' '2' '3' [0.45]
        A8 -> '6' '5' [0.55]
        A8 -> '6' '4' '5' [0.45]
        A9 -> '9' '8' '7' [0.55]
        A9 -> '8' '7' [0.45]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.60": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.60]
        A7 -> '1' '2' '3' [0.40]
        A8 -> '6' '5' [0.60]
        A8 -> '6' '4' '5' [0.40]
        A9 -> '9' '8' '7' [0.60]
        A9 -> '8' '7' [0.40]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.70": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.70]
        A7 -> '1' '2' '3' [0.30]
        A8 -> '6' '5' [0.70]
        A8 -> '6' '4' '5' [0.30]
        A9 -> '9' '8' '7' [0.70]
        A9 -> '8' '7' [0.30]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.85": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.85]
        A7 -> '1' '2' '3' [0.15]
        A8 -> '6' '5' [0.85]
        A8 -> '6' '4' '5' [0.15]
        A9 -> '9' '8' '7' [0.85]
        A9 -> '8' '7' [0.15]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.80": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.80]
        A7 -> '1' '2' '3' [0.20]
        A8 -> '6' '5' [0.80]
        A8 -> '6' '4' '5' [0.20]
        A9 -> '9' '8' '7' [0.80]
        A9 -> '8' '7' [0.20]
    """,


    "pcfg_cfg3b_disjoint_terminals_leaf_0.90": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.90]
        A7 -> '1' '2' '3' [0.10]
        A8 -> '6' '5' [0.90]
        A8 -> '6' '4' '5' [0.10]
        A9 -> '9' '8' '7' [0.90]
        A9 -> '8' '7' [0.10]
    """,



    "pcfg_cfg3b_disjoint_terminals_all_rules_0.55": """
        S -> A16 [1]
        A16 -> A15 A13 [0.55]
        A16 -> A13 A15 A14 [0.45]
        A13 -> A11 A12 [0.55]
        A13 -> A12 A11 [0.45]
        A14 -> A11 A10 A12 [0.55]
        A14 -> A10 A11 A12 [0.45]
        A15 -> A12 A11 A10 [0.55]
        A15 -> A11 A12 A10 [0.45]
        A10 -> A7 A9 A8 [0.55]
        A10 -> A9 A8 A7 [0.45]
        A11 -> A8 A7 A9 [0.55]
        A11 -> A7 A8 A9 [0.45]
        A12 -> A8 A9 A7 [0.55]
        A12 -> A9 A7 A8 [0.45]
        A7 -> '3' '1' [0.55]
        A7 -> '1' '2' '3' [0.45]
        A8 -> '6' '5' [0.55]
        A8 -> '6' '4' '5' [0.45]
        A9 -> '9' '8' '7' [0.55]
        A9 -> '8' '7' [0.45]
    """,


    "pcfg_cfg3b_disjoint_terminals_all_rules_0.60": """
        S -> A16 [1]
        A16 -> A15 A13 [0.60]
        A16 -> A13 A15 A14 [0.40]
        A13 -> A11 A12 [0.60]
        A13 -> A12 A11 [0.40]
        A14 -> A11 A10 A12 [0.60]
        A14 -> A10 A11 A12 [0.40]
        A15 -> A12 A11 A10 [0.60]
        A15 -> A11 A12 A10 [0.40]
        A10 -> A7 A9 A8 [0.60]
        A10 -> A9 A8 A7 [0.40]
        A11 -> A8 A7 A9 [0.60]
        A11 -> A7 A8 A9 [0.40]
        A12 -> A8 A9 A7 [0.60]
        A12 -> A9 A7 A8 [0.40]
        A7 -> '3' '1' [0.60]
        A7 -> '1' '2' '3' [0.40]
        A8 -> '6' '5' [0.60]
        A8 -> '6' '4' '5' [0.40]
        A9 -> '9' '8' '7' [0.60]
        A9 -> '8' '7' [0.40]
    """,


    "pcfg_cfg3b_disjoint_terminals_all_rules_0.70": """
        S -> A16 [1]
        A16 -> A15 A13 [0.70]
        A16 -> A13 A15 A14 [0.30]
        A13 -> A11 A12 [0.70]
        A13 -> A12 A11 [0.30]
        A14 -> A11 A10 A12 [0.70]
        A14 -> A10 A11 A12 [0.30]
        A15 -> A12 A11 A10 [0.70]
        A15 -> A11 A12 A10 [0.30]
        A10 -> A7 A9 A8 [0.70]
        A10 -> A9 A8 A7 [0.30]
        A11 -> A8 A7 A9 [0.70]
        A11 -> A7 A8 A9 [0.30]
        A12 -> A8 A9 A7 [0.70]
        A12 -> A9 A7 A8 [0.30]
        A7 -> '3' '1' [0.70]
        A7 -> '1' '2' '3' [0.30]
        A8 -> '6' '5' [0.70]
        A8 -> '6' '4' '5' [0.30]
        A9 -> '9' '8' '7' [0.70]
        A9 -> '8' '7' [0.30]
    """,




    "pcfg_cfg3b_disjoint_terminals_all_rules_0.80": """
        S -> A16 [1]
        A16 -> A15 A13 [0.80]
        A16 -> A13 A15 A14 [0.20]
        A13 -> A11 A12 [0.80]
        A13 -> A12 A11 [0.20]
        A14 -> A11 A10 A12 [0.80]
        A14 -> A10 A11 A12 [0.20]
        A15 -> A12 A11 A10 [0.80]
        A15 -> A11 A12 A10 [0.20]
        A10 -> A7 A9 A8 [0.80]
        A10 -> A9 A8 A7 [0.20]
        A11 -> A8 A7 A9 [0.80]
        A11 -> A7 A8 A9 [0.20]
        A12 -> A8 A9 A7 [0.80]
        A12 -> A9 A7 A8 [0.20]
        A7 -> '3' '1' [0.80]
        A7 -> '1' '2' '3' [0.20]
        A8 -> '6' '5' [0.80]
        A8 -> '6' '4' '5' [0.20]
        A9 -> '9' '8' '7' [0.80]
        A9 -> '8' '7' [0.20]
    """,


    "pcfg_cfg3b_disjoint_terminals_all_rules_0.90": """
        S -> A16 [1]
        A16 -> A15 A13 [0.90]
        A16 -> A13 A15 A14 [0.10]
        A13 -> A11 A12 [0.90]
        A13 -> A12 A11 [0.10]
        A14 -> A11 A10 A12 [0.90]
        A14 -> A10 A11 A12 [0.10]
        A15 -> A12 A11 A10 [0.90]
        A15 -> A11 A12 A10 [0.10]
        A10 -> A7 A9 A8 [0.90]
        A10 -> A9 A8 A7 [0.10]
        A11 -> A8 A7 A9 [0.90]
        A11 -> A7 A8 A9 [0.10]
        A12 -> A8 A9 A7 [0.90]
        A12 -> A9 A7 A8 [0.10]
        A7 -> '3' '1' [0.90]
        A7 -> '1' '2' '3' [0.10]
        A8 -> '6' '5' [0.90]
        A8 -> '6' '4' '5' [0.10]
        A9 -> '9' '8' '7' [0.90]
        A9 -> '8' '7' [0.10]
    """,



    "pcfg_cfg3b_disjoint_terminals_all_rules_0.95": """
        S -> A16 [1]
        A16 -> A15 A13 [0.95]
        A16 -> A13 A15 A14 [0.05]
        A13 -> A11 A12 [0.95]
        A13 -> A12 A11 [0.05]
        A14 -> A11 A10 A12 [0.95]
        A14 -> A10 A11 A12 [0.05]
        A15 -> A12 A11 A10 [0.95]
        A15 -> A11 A12 A10 [0.05]
        A10 -> A7 A9 A8 [0.95]
        A10 -> A9 A8 A7 [0.05]
        A11 -> A8 A7 A9 [0.95]
        A11 -> A7 A8 A9 [0.05]
        A12 -> A8 A9 A7 [0.95]
        A12 -> A9 A7 A8 [0.05]
        A7 -> '3' '1' [0.95]
        A7 -> '1' '2' '3' [0.05]
        A8 -> '6' '5' [0.95]
        A8 -> '6' '4' '5' [0.05]
        A9 -> '9' '8' '7' [0.95]
        A9 -> '8' '7' [0.05]
    """,



    "pcfg_cfg3b_disjoint_terminals_one_rule_different": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '3' '2' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    

    "pcfg_cfg3b_disjoint_terminals_two_rules_different": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '3' '2' [0.50]
        A8 -> '5' '6' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    "pcfg_cfg3b_disjoint_terminals_three_rules_different": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '3' '2' [0.50]
        A8 -> '5' '6' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '8' '7' '9' [0.50]
        A9 -> '8' '7' [0.50]
    """,

    "pcfg_cfg3b_disjoint_terminals_four_rules_different": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '2' '3' [0.50]
        A7 -> '1' '3' '2' [0.50]
        A8 -> '5' '6' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '8' '7' '9' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    "pcfg_cfg3b_disjoint_terminals_five_rules_different": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '2' '3' [0.50]
        A7 -> '1' '3' '2' [0.50]
        A8 -> '5' '6' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '8' '7' '9' [0.50]
        A9 -> '7' '8' [0.50]
    """,



    "pcfg_cfg3b_disjoint_terminals_latin": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> 'c' 'a' [0.50]
        A7 -> 'a' 'b' 'c' [0.50]
        A8 -> 'f' 'e' [0.50]
        A8 -> 'f' 'd' 'e' [0.50]
        A9 -> 'i' 'h' 'g' [0.50]
        A9 -> 'h' 'g' [0.50]
    """,

    "pcfg_cfg3b_eq_len_skewed_prob": """
        S -> A16 [1]
        A16 -> A15 A14 A13 [0.95]
        A16 -> A13 A15 A14 [0.05]
        A13 -> A11 A12 [0.95]
        A13 -> A12 A11 [0.05]
        A14 -> A11 A10 A12 [0.95]
        A14 -> A10 A11 A12 [0.05]
        A15 -> A12 A11 A10 [0.95]
        A15 -> A11 A12 A10 [0.05]
        A10 -> A7 A9 A8 [0.95]
        A10 -> A9 A8 A7 [0.05]
        A11 -> A8 A7 A9 [0.95]
        A11 -> A7 A8 A9 [0.05]
        A12 -> A8 A9 A7 [0.95]
        A12 -> A9 A7 A8 [0.05]
        A7 -> '3' '1' '2' [0.95]
        A7 -> '1' '2' '3' [0.05]
        A8 -> '6' '5' '4' [0.95]
        A8 -> '6' '4' '5' [0.05]
        A9 -> '9' '8' '7' [0.95]
        A9 -> '8' '7' '9' [0.05]
    """,


    "pcfg_cfg3b_eq_len_skewed_prob_0.90": """
        S -> A16 [1]
        A16 -> A15 A14 A13 [0.90]
        A16 -> A13 A15 A14 [0.10]
        A13 -> A11 A12 [0.90]
        A13 -> A12 A11 [0.10]
        A14 -> A11 A10 A12 [0.90]
        A14 -> A10 A11 A12 [0.10]
        A15 -> A12 A11 A10 [0.90]
        A15 -> A11 A12 A10 [0.10]
        A10 -> A7 A9 A8 [0.90]
        A10 -> A9 A8 A7 [0.10]
        A11 -> A8 A7 A9 [0.90]
        A11 -> A7 A8 A9 [0.10]
        A12 -> A8 A9 A7 [0.90]
        A12 -> A9 A7 A8 [0.10]
        A7 -> '3' '1' '2' [0.90]
        A7 -> '1' '2' '3' [0.10]
        A8 -> '6' '5' '4' [0.90]
        A8 -> '6' '4' '5' [0.10]
        A9 -> '9' '8' '7' [0.90]
        A9 -> '8' '7' '9' [0.10]
    """,


    "pcfg_cfg3b_eq_len_skewed_prob_0.75": """
        S -> A16 [1]
        A16 -> A15 A14 A13 [0.75]
        A16 -> A13 A15 A14 [0.25]
        A13 -> A11 A12 [0.75]
        A13 -> A12 A11 [0.25]
        A14 -> A11 A10 A12 [0.75]
        A14 -> A10 A11 A12 [0.25]
        A15 -> A12 A11 A10 [0.75]
        A15 -> A11 A12 A10 [0.25]
        A10 -> A7 A9 A8 [0.75]
        A10 -> A9 A8 A7 [0.25]
        A11 -> A8 A7 A9 [0.75]
        A11 -> A7 A8 A9 [0.25]
        A12 -> A8 A9 A7 [0.75]
        A12 -> A9 A7 A8 [0.25]
        A7 -> '3' '1' '2' [0.75]
        A7 -> '1' '2' '3' [0.25]
        A8 -> '6' '5' '4' [0.75]
        A8 -> '6' '4' '5' [0.25]
        A9 -> '9' '8' '7' [0.75]
        A9 -> '8' '7' '9' [0.25]
    """,


    "pcfg_cfg3b_eq_len_uniform_prob": """
        S -> A16 [1]
        A16 -> A15 A14 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' '2' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' '4' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' '9' [0.50]
    """,

    "pcfg_cfg3b_disjoint_terminals_one_rule_missing": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [1]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]
    """,


    "pcsg_csg3b_disjoint_terminals_A8_left": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]


        A7 A8 -> A7 '5' '6' [0.50]
        A7 A8 -> A7 '5' '4' '6' [0.50]
    """,


    "pcsg_csg3b_disjoint_terminals_A8_right": """
        S -> A16 [1]
        A16 -> A15 A13 [0.50]
        A16 -> A13 A15 A14 [0.50]
        A13 -> A11 A12 [0.50]
        A13 -> A12 A11 [0.50]
        A14 -> A11 A10 A12 [0.50]
        A14 -> A10 A11 A12 [0.50]
        A15 -> A12 A11 A10 [0.50]
        A15 -> A11 A12 A10 [0.50]
        A10 -> A7 A9 A8 [0.50]
        A10 -> A9 A8 A7 [0.50]
        A11 -> A8 A7 A9 [0.50]
        A11 -> A7 A8 A9 [0.50]
        A12 -> A8 A9 A7 [0.50]
        A12 -> A9 A7 A8 [0.50]
        A7 -> '3' '1' [0.50]
        A7 -> '1' '2' '3' [0.50]
        A8 -> '6' '5' [0.50]
        A8 -> '6' '4' '5' [0.50]
        A9 -> '9' '8' '7' [0.50]
        A9 -> '8' '7' [0.50]


        A8 A7 -> '5' '6' A7 [0.50]
        A8 A7 -> '5' '4' '6' A7 [0.50]
    """,


    "preg_alphabet_2": """
        S -> A1 [0.5]
        S -> A2 [0.5]
        A1 -> 'a' S [0.9]
        A1 -> 'a'  [0.1]
        A2 -> 'b' S [0.9]
        A2 -> 'b'  [0.1]
    """,


    "preg_alphabet_7": """
        S -> A1 [0.142]
        S -> A2 [0.142]
        S -> A3 [0.142]
        S -> A4 [0.142]
        S -> A5 [0.142]
        S -> A6 [0.142]
        S -> A7 [0.142]
        A1 -> 'a' S [0.9]
        A1 -> 'a'  [0.1]
        A2 -> 'b' S [0.9]
        A2 -> 'b'  [0.1]
        A3 -> 'c' S [0.9]
        A3 -> 'c'  [0.1]
        A4 -> 'd' S [0.9]
        A4 -> 'd'  [0.1]
        A5 -> 'e' S [0.9]
        A5 -> 'e'  [0.1]
        A6 -> 'f' S [0.9]
        A6 -> 'f'  [0.1]
        A7 -> 'g' S [0.9]
        A7 -> 'g'  [0.1]
    """,



    "preg_alphabet_26": """
        S -> A1 [0.0384]
        S -> A2 [0.0384]
        S -> A3 [0.0384]
        S -> A4 [0.0384]
        S -> A5 [0.0384]
        S -> A6 [0.0384]
        S -> A7 [0.0384]
        S -> A8 [0.0384]
        S -> A9 [0.0384]
        S -> A10 [0.0384]
        S -> A11 [0.0384]
        S -> A12 [0.0384]
        S -> A13 [0.0384]
        S -> A14 [0.0384]
        S -> A15 [0.0384]
        S -> A16 [0.0384]
        S -> A17 [0.0384]
        S -> A18 [0.0384]
        S -> A19 [0.0384]
        S -> A20 [0.0384]
        S -> A21 [0.0384]
        S -> A22 [0.0384]
        S -> A23 [0.0384]
        S -> A24 [0.0384]
        S -> A25 [0.0384]
        S -> A26 [0.0384]
        A1 -> 'a' S [0.9]
        A1 -> 'a'  [0.1]
        A2 -> 'b' S [0.9]
        A2 -> 'b'  [0.1]
        A3 -> 'c' S [0.9]
        A3 -> 'c'  [0.1]
        A4 -> 'd' S [0.9]
        A4 -> 'd'  [0.1]
        A5 -> 'e' S [0.9]
        A5 -> 'e'  [0.1]
        A6 -> 'f' S [0.9]
        A6 -> 'f'  [0.1]
        A7 -> 'g' S [0.9]
        A7 -> 'g'  [0.1]
        A8 -> 'h' S [0.9]
        A8 -> 'h'  [0.1]
        A9 -> 'i' S [0.9]
        A9 -> 'i'  [0.1]
        A10 -> 'j' S [0.9]
        A10 -> 'j'  [0.1]
        A11 -> 'k' S [0.9]
        A11 -> 'k'  [0.1]
        A12 -> 'l' S [0.9]
        A12 -> 'l'  [0.1]
        A13 -> 'm' S [0.9]
        A13 -> 'm'  [0.1]
        A14 -> 'n' S [0.9]
        A14 -> 'n'  [0.1]
        A15 -> 'o' S [0.9]
        A15 -> 'o'  [0.1]
        A16 -> 'p' S [0.9]
        A16 -> 'p'  [0.1]
        A17 -> 'q' S [0.9]
        A17 -> 'q'  [0.1]
        A18 -> 'r' S [0.9]
        A18 -> 'r'  [0.1]
        A19 -> 's' S [0.9]
        A19 -> 's'  [0.1]
        A20 -> 't' S [0.9]
        A20 -> 't'  [0.1]
        A21 -> 'u' S [0.9]
        A21 -> 'u'  [0.1]
        A22 -> 'v' S [0.9]
        A22 -> 'v'  [0.1]
        A23 -> 'w' S [0.9]
        A23 -> 'w'  [0.1]
        A24 -> 'x' S [0.9]
        A24 -> 'x'  [0.1]
        A25 -> 'y' S [0.9]
        A25 -> 'y'  [0.1]
        A26 -> 'z' S [0.9]
        A26 -> 'z'  [0.1]
    """,


    "preg_alphabet_combined": """
        S -> S_2 [0.3333]
        S -> S_7 [0.3333]
        S -> S_26 [0.3333]
        S_2 -> A_2_1 [0.5]
        S_2 -> A_2_2 [0.5]
        A_2_1 -> 'a' S_2 [0.9]
        A_2_1 -> 'a'  [0.1]
        A_2_2 -> 'b' S_2 [0.9]
        A_2_2 -> 'b'  [0.1]
        S_7 -> A_7_1 [0.142]
        S_7 -> A_7_2 [0.142]
        S_7 -> A_7_3 [0.142]
        S_7 -> A_7_4 [0.142]
        S_7 -> A_7_5 [0.142]
        S_7 -> A_7_6 [0.142]
        S_7 -> A_7_7 [0.142]
        A_7_1 -> 'a' S_7 [0.9]
        A_7_1 -> 'a'  [0.1]
        A_7_2 -> 'b' S_7 [0.9]
        A_7_2 -> 'b'  [0.1]
        A_7_3 -> 'c' S_7 [0.9]
        A_7_3 -> 'c'  [0.1]
        A_7_4 -> 'd' S_7 [0.9]
        A_7_4 -> 'd'  [0.1]
        A_7_5 -> 'e' S_7 [0.9]
        A_7_5 -> 'e'  [0.1]
        A_7_6 -> 'f' S_7 [0.9]
        A_7_6 -> 'f'  [0.1]
        A_7_7 -> 'g' S_7 [0.9]
        A_7_7 -> 'g'  [0.1]
        S_26 -> A_26_1 [0.0384]
        S_26 -> A_26_2 [0.0384]
        S_26 -> A_26_3 [0.0384]
        S_26 -> A_26_4 [0.0384]
        S_26 -> A_26_5 [0.0384]
        S_26 -> A_26_6 [0.0384]
        S_26 -> A_26_7 [0.0384]
        S_26 -> A_26_8 [0.0384]
        S_26 -> A_26_9 [0.0384]
        S_26 -> A_26_10 [0.0384]
        S_26 -> A_26_11 [0.0384]
        S_26 -> A_26_12 [0.0384]
        S_26 -> A_26_13 [0.0384]
        S_26 -> A_26_14 [0.0384]
        S_26 -> A_26_15 [0.0384]
        S_26 -> A_26_16 [0.0384]
        S_26 -> A_26_17 [0.0384]
        S_26 -> A_26_18 [0.0384]
        S_26 -> A_26_19 [0.0384]
        S_26 -> A_26_20 [0.0384]
        S_26 -> A_26_21 [0.0384]
        S_26 -> A_26_22 [0.0384]
        S_26 -> A_26_23 [0.0384]
        S_26 -> A_26_24 [0.0384]
        S_26 -> A_26_25 [0.0384]
        S_26 -> A_26_26 [0.0384]
        A_26_1 -> 'a' S_26 [0.9]
        A_26_1 -> 'a'  [0.1]
        A_26_2 -> 'b' S_26 [0.9]
        A_26_2 -> 'b'  [0.1]
        A_26_3 -> 'c' S_26 [0.9]
        A_26_3 -> 'c'  [0.1]
        A_26_4 -> 'd' S_26 [0.9]
        A_26_4 -> 'd'  [0.1]
        A_26_5 -> 'e' S_26 [0.9]
        A_26_5 -> 'e'  [0.1]
        A_26_6 -> 'f' S_26 [0.9]
        A_26_6 -> 'f'  [0.1]
        A_26_7 -> 'g' S_26 [0.9]
        A_26_7 -> 'g'  [0.1]
        A_26_8 -> 'h' S_26 [0.9]
        A_26_8 -> 'h'  [0.1]
        A_26_9 -> 'i' S_26 [0.9]
        A_26_9 -> 'i'  [0.1]
        A_26_10 -> 'j' S_26 [0.9]
        A_26_10 -> 'j'  [0.1]
        A_26_11 -> 'k' S_26 [0.9]
        A_26_11 -> 'k'  [0.1]
        A_26_12 -> 'l' S_26 [0.9]
        A_26_12 -> 'l'  [0.1]
        A_26_13 -> 'm' S_26 [0.9]
        A_26_13 -> 'm'  [0.1]
        A_26_14 -> 'n' S_26 [0.9]
        A_26_14 -> 'n'  [0.1]
        A_26_15 -> 'o' S_26 [0.9]
        A_26_15 -> 'o'  [0.1]
        A_26_16 -> 'p' S_26 [0.9]
        A_26_16 -> 'p'  [0.1]
        A_26_17 -> 'q' S_26 [0.9]
        A_26_17 -> 'q'  [0.1]
        A_26_18 -> 'r' S_26 [0.9]
        A_26_18 -> 'r'  [0.1]
        A_26_19 -> 's' S_26 [0.9]
        A_26_19 -> 's'  [0.1]
        A_26_20 -> 't' S_26 [0.9]
        A_26_20 -> 't'  [0.1]
        A_26_21 -> 'u' S_26 [0.9]
        A_26_21 -> 'u'  [0.1]
        A_26_22 -> 'v' S_26 [0.9]
        A_26_22 -> 'v'  [0.1]
        A_26_23 -> 'w' S_26 [0.9]
        A_26_23 -> 'w'  [0.1]
        A_26_24 -> 'x' S_26 [0.9]
        A_26_24 -> 'x'  [0.1]
        A_26_25 -> 'y' S_26 [0.9]
        A_26_25 -> 'y'  [0.1]
        A_26_26 -> 'z' S_26 [0.9]
        A_26_26 -> 'z'  [0.1]

    """,
    
    # S -> S_2 [0.64]
    # S -> S_7 [0.22]
    # S -> S_26 [0.14]

    # "preg_alphabet_combined_skewed_prob": """
    #     S -> S_2 [0.33]
    #     S -> S_7 [0.33]
    #     S -> S_26 [0.33]
    #     S_2 -> A_2_1 [0.5]
    #     S_2 -> A_2_2 [0.5]
    #     A_2_1 -> 'a' S_2 [0.9]
    #     A_2_1 -> 'a'  [0.1]
    #     A_2_2 -> 'b' S_2 [0.9]
    #     A_2_2 -> 'b'  [0.1]
    #     S_7 -> A_7_1 [0.142]
    #     S_7 -> A_7_2 [0.142]
    #     S_7 -> A_7_3 [0.142]
    #     S_7 -> A_7_4 [0.142]
    #     S_7 -> A_7_5 [0.142]
    #     S_7 -> A_7_6 [0.142]
    #     S_7 -> A_7_7 [0.142]
    #     A_7_1 -> 'a' S_7 [0.9]
    #     A_7_1 -> 'a'  [0.1]
    #     A_7_2 -> 'b' S_7 [0.9]
    #     A_7_2 -> 'b'  [0.1]
    #     A_7_3 -> 'c' S_7 [0.9]
    #     A_7_3 -> 'c'  [0.1]
    #     A_7_4 -> 'd' S_7 [0.9]
    #     A_7_4 -> 'd'  [0.1]
    #     A_7_5 -> 'e' S_7 [0.9]
    #     A_7_5 -> 'e'  [0.1]
    #     A_7_6 -> 'f' S_7 [0.9]
    #     A_7_6 -> 'f'  [0.1]
    #     A_7_7 -> 'g' S_7 [0.9]
    #     A_7_7 -> 'g'  [0.1]
    #     S_26 -> A_26_1 [0.0384]
    #     S_26 -> A_26_2 [0.0384]
    #     S_26 -> A_26_3 [0.0384]
    #     S_26 -> A_26_4 [0.0384]
    #     S_26 -> A_26_5 [0.0384]
    #     S_26 -> A_26_6 [0.0384]
    #     S_26 -> A_26_7 [0.0384]
    #     S_26 -> A_26_8 [0.0384]
    #     S_26 -> A_26_9 [0.0384]
    #     S_26 -> A_26_10 [0.0384]
    #     S_26 -> A_26_11 [0.0384]
    #     S_26 -> A_26_12 [0.0384]
    #     S_26 -> A_26_13 [0.0384]
    #     S_26 -> A_26_14 [0.0384]
    #     S_26 -> A_26_15 [0.0384]
    #     S_26 -> A_26_16 [0.0384]
    #     S_26 -> A_26_17 [0.0384]
    #     S_26 -> A_26_18 [0.0384]
    #     S_26 -> A_26_19 [0.0384]
    #     S_26 -> A_26_20 [0.0384]
    #     S_26 -> A_26_21 [0.0384]
    #     S_26 -> A_26_22 [0.0384]
    #     S_26 -> A_26_23 [0.0384]
    #     S_26 -> A_26_24 [0.0384]
    #     S_26 -> A_26_25 [0.0384]
    #     S_26 -> A_26_26 [0.0384]
    #     A_26_1 -> 'a' S_26 [0.9]
    #     A_26_1 -> 'a'  [0.1]
    #     A_26_2 -> 'b' S_26 [0.9]
    #     A_26_2 -> 'b'  [0.1]
    #     A_26_3 -> 'c' S_26 [0.9]
    #     A_26_3 -> 'c'  [0.1]
    #     A_26_4 -> 'd' S_26 [0.9]
    #     A_26_4 -> 'd'  [0.1]
    #     A_26_5 -> 'e' S_26 [0.9]
    #     A_26_5 -> 'e'  [0.1]
    #     A_26_6 -> 'f' S_26 [0.9]
    #     A_26_6 -> 'f'  [0.1]
    #     A_26_7 -> 'g' S_26 [0.9]
    #     A_26_7 -> 'g'  [0.1]
    #     A_26_8 -> 'h' S_26 [0.9]
    #     A_26_8 -> 'h'  [0.1]
    #     A_26_9 -> 'i' S_26 [0.9]
    #     A_26_9 -> 'i'  [0.1]
    #     A_26_10 -> 'j' S_26 [0.9]
    #     A_26_10 -> 'j'  [0.1]
    #     A_26_11 -> 'k' S_26 [0.9]
    #     A_26_11 -> 'k'  [0.1]
    #     A_26_12 -> 'l' S_26 [0.9]
    #     A_26_12 -> 'l'  [0.1]
    #     A_26_13 -> 'm' S_26 [0.9]
    #     A_26_13 -> 'm'  [0.1]
    #     A_26_14 -> 'n' S_26 [0.9]
    #     A_26_14 -> 'n'  [0.1]
    #     A_26_15 -> 'o' S_26 [0.9]
    #     A_26_15 -> 'o'  [0.1]
    #     A_26_16 -> 'p' S_26 [0.9]
    #     A_26_16 -> 'p'  [0.1]
    #     A_26_17 -> 'q' S_26 [0.9]
    #     A_26_17 -> 'q'  [0.1]
    #     A_26_18 -> 'r' S_26 [0.9]
    #     A_26_18 -> 'r'  [0.1]
    #     A_26_19 -> 's' S_26 [0.9]
    #     A_26_19 -> 's'  [0.1]
    #     A_26_20 -> 't' S_26 [0.9]
    #     A_26_20 -> 't'  [0.1]
    #     A_26_21 -> 'u' S_26 [0.9]
    #     A_26_21 -> 'u'  [0.1]
    #     A_26_22 -> 'v' S_26 [0.9]
    #     A_26_22 -> 'v'  [0.1]
    #     A_26_23 -> 'w' S_26 [0.9]
    #     A_26_23 -> 'w'  [0.1]
    #     A_26_24 -> 'x' S_26 [0.9]
    #     A_26_24 -> 'x'  [0.1]
    #     A_26_25 -> 'y' S_26 [0.9]
    #     A_26_25 -> 'y'  [0.1]
    #     A_26_26 -> 'z' S_26 [0.9]
    #     A_26_26 -> 'z'  [0.1]

    # """,
    

    "preg_numeral_2": """
        S -> A1 [0.5]
        S -> A2 [0.5]
        A1 -> '0' S [0.9]
        A1 -> '0'  [0.1]
        A2 -> '1' S [0.9]
        A2 -> '1'  [0.1]
    """,


    "preg_numeral_7": """
        S -> A1 [0.142]
        S -> A2 [0.142]
        S -> A3 [0.142]
        S -> A4 [0.142]
        S -> A5 [0.142]
        S -> A6 [0.142]
        S -> A7 [0.142]
        A1 -> '0' S [0.9]
        A1 -> '0'  [0.1]
        A2 -> '1' S [0.9]
        A2 -> '1'  [0.1]
        A3 -> '2' S [0.9]
        A3 -> '2'  [0.1]
        A4 -> '3' S [0.9]
        A4 -> '3'  [0.1]
        A5 -> '4' S [0.9]
        A5 -> '4'  [0.1]
        A6 -> '5' S [0.9]
        A6 -> '5'  [0.1]
        A7 -> '6' S [0.9]
        A7 -> '6'  [0.1]
    """,

    "preg_numeral_10": """
        S -> A1 [0.1]
        S -> A2 [0.1]
        S -> A3 [0.1]
        S -> A4 [0.1]
        S -> A5 [0.1]
        S -> A6 [0.1]
        S -> A7 [0.1]
        S -> A8 [0.1]
        S -> A9 [0.1]
        S -> A10 [0.1]
        A1 -> '0' S [0.9]
        A1 -> '0'  [0.1]
        A2 -> '1' S [0.9]
        A2 -> '1'  [0.1]
        A3 -> '2' S [0.9]
        A3 -> '2'  [0.1]
        A4 -> '3' S [0.9]
        A4 -> '3'  [0.1]
        A5 -> '4' S [0.9]
        A5 -> '4'  [0.1]
        A6 -> '5' S [0.9]
        A6 -> '5'  [0.1]
        A7 -> '6' S [0.9]
        A7 -> '6'  [0.1]
        A8 -> '7' S [0.9]
        A8 -> '7'  [0.1]
        A9 -> '8' S [0.9]
        A9 -> '8'  [0.1]
        A10 -> '9' S [0.9]
        A10 -> '9'  [0.1]
    """,


    "pcfg_4_3_1_2_3_4_5_6_7_8_9_latin": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.3333]
        B_4 -> B_3 B_3 B_3 [0.3333]
        B_4 -> B_3 B_3 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 B_2 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 B_1 B_1 [0.3333]
        B_1 -> 'b' 'i' 'c' [0.3333]
        B_1 -> 'i' 'f' 'a' [0.3333]
        B_1 -> 'a' 'h' 'f' 'b' [0.3333]
        E_4 -> E_3 [0.3333]
        E_4 -> E_3 E_3 [0.3333]
        E_4 -> E_3 E_3 E_3 [0.3333]
        E_3 -> E_2 [0.3333]
        E_3 -> E_2 E_2 [0.3333]
        E_3 -> E_2 [0.3333]
        E_2 -> E_1 E_1 [0.3333]
        E_2 -> E_1 [0.3333]
        E_2 -> E_1 E_1 E_1 [0.3333]
        E_1 -> 'e' 'f' [0.3333]
        E_1 -> 'a' 'h' 'f' 'f' [0.3333]
        E_1 -> 'a' 'e' 'a' 'e' 'e' 'i' [0.3333]
        T_1_1 -> 'a' [1]
        T_1_2 -> 'b' [1]
        T_1_3 -> 'c' [1]
        T_1_4 -> 'd' [1]
        C_1_1 -> 'e' [1]
        C_1_2 -> 'f' [1]
        C_1_3 -> 'g' [1]
        C_1_4 -> 'h' [1]
        C_1_5 -> 'i' [1]
    """,



    "pcfg_4_3_1_2_3_4_5_6_7_8_9": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.3333]
        B_4 -> B_3 B_3 B_3 [0.3333]
        B_4 -> B_3 B_3 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 B_2 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 B_1 B_1 [0.3333]
        B_1 -> '2' '9' '3' [0.3333]
        B_1 -> '9' '6' '1' [0.3333]
        B_1 -> '1' '8' '6' '2' [0.3333]
        E_4 -> E_3 [0.3333]
        E_4 -> E_3 E_3 [0.3333]
        E_4 -> E_3 E_3 E_3 [0.3333]
        E_3 -> E_2 [0.3333]
        E_3 -> E_2 E_2 [0.3333]
        E_3 -> E_2 [0.3333]
        E_2 -> E_1 E_1 [0.3333]
        E_2 -> E_1 [0.3333]
        E_2 -> E_1 E_1 E_1 [0.3333]
        E_1 -> '5' '6' [0.3333]
        E_1 -> '1' '8' '6' '6' [0.3333]
        E_1 -> '1' '5' '1' '5' '5' '9' [0.3333]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,


    "pcfg_4_3_1_2_3_4_5_6_7_8_9_skewed_0.5": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.25]
        B_4 -> B_3 B_3 B_3 [0.5]
        B_4 -> B_3 B_3 [0.25]
        B_3 -> B_2 [0.25]
        B_3 -> B_2 [0.5]
        B_3 -> B_2 B_2 [0.25]
        B_2 -> B_1 [0.25]
        B_2 -> B_1 [0.5]
        B_2 -> B_1 B_1 B_1 [0.25]
        B_1 -> '2' '9' '3' [0.25]
        B_1 -> '9' '6' '1' [0.5]
        B_1 -> '1' '8' '6' '2' [0.25]
        E_4 -> E_3 [0.25]
        E_4 -> E_3 E_3 [0.5]
        E_4 -> E_3 E_3 E_3 [0.25]
        E_3 -> E_2 [0.25]
        E_3 -> E_2 E_2 [0.5]
        E_3 -> E_2 [0.25]
        E_2 -> E_1 E_1 [0.25]
        E_2 -> E_1 [0.5]
        E_2 -> E_1 E_1 E_1 [0.25]
        E_1 -> '5' '6' [0.25]
        E_1 -> '1' '8' '6' '6' [0.5]
        E_1 -> '1' '5' '1' '5' '5' '9' [0.25]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,


    "pcfg_4_3_1_2_3_4_5_6_7_8_9_skewed_0.8": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.1]
        B_4 -> B_3 B_3 B_3 [0.8]
        B_4 -> B_3 B_3 [0.1]
        B_3 -> B_2 [0.1]
        B_3 -> B_2 [0.8]
        B_3 -> B_2 B_2 [0.1]
        B_2 -> B_1 [0.1]
        B_2 -> B_1 [0.8]
        B_2 -> B_1 B_1 B_1 [0.1]
        B_1 -> '2' '9' '3' [0.1]
        B_1 -> '9' '6' '1' [0.8]
        B_1 -> '1' '8' '6' '2' [0.1]
        E_4 -> E_3 [0.1]
        E_4 -> E_3 E_3 [0.8]
        E_4 -> E_3 E_3 E_3 [0.1]
        E_3 -> E_2 [0.1]
        E_3 -> E_2 E_2 [0.8]
        E_3 -> E_2 [0.1]
        E_2 -> E_1 E_1 [0.1]
        E_2 -> E_1 [0.8]
        E_2 -> E_1 E_1 E_1 [0.1]
        E_1 -> '5' '6' [0.1]
        E_1 -> '1' '8' '6' '6' [0.8]
        E_1 -> '1' '5' '1' '5' '5' '9' [0.1]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,



    "pcfg_4_3_1_2_3_4_5_6_7_8_9_skewed_0.95": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.025]
        B_4 -> B_3 B_3 B_3 [0.95]
        B_4 -> B_3 B_3 [0.025]
        B_3 -> B_2 [0.025]
        B_3 -> B_2 [0.95]
        B_3 -> B_2 B_2 [0.025]
        B_2 -> B_1 [0.025]
        B_2 -> B_1 [0.95]
        B_2 -> B_1 B_1 B_1 [0.025]
        B_1 -> '2' '9' '3' [0.025]
        B_1 -> '9' '6' '1' [0.95]
        B_1 -> '1' '8' '6' '2' [0.025]
        E_4 -> E_3 [0.025]
        E_4 -> E_3 E_3 [0.95]
        E_4 -> E_3 E_3 E_3 [0.025]
        E_3 -> E_2 [0.025]
        E_3 -> E_2 E_2 [0.95]
        E_3 -> E_2 [0.025]
        E_2 -> E_1 E_1 [0.025]
        E_2 -> E_1 [0.95]
        E_2 -> E_1 E_1 E_1 [0.025]
        E_1 -> '5' '6' [0.025]
        E_1 -> '1' '8' '6' '6' [0.95]
        E_1 -> '1' '5' '1' '5' '5' '9' [0.025]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,



    "pcfg_4_3_1_2_3_4_5_6_7_8_9_eq_len_uniform_prob": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.3333]
        B_4 -> B_3 B_3 B_3 [0.3333]
        B_4 -> B_3 B_3 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 B_2 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 B_1 B_1 [0.3333]
        B_1 -> '2' '9' '3' [0.3333]
        B_1 -> '9' '6' '1' [0.3333]
        B_1 -> '1' '8' '6' [0.3333]
        E_4 -> E_3 [0.3333]
        E_4 -> E_3 E_3 [0.3333]
        E_4 -> E_3 E_3 E_3 [0.3333]
        E_3 -> E_2 [0.3333]
        E_3 -> E_2 E_2 [0.3333]
        E_3 -> E_2 [0.3333]
        E_2 -> E_1 E_1 [0.3333]
        E_2 -> E_1 [0.3333]
        E_2 -> E_1 E_1 E_1 [0.3333]
        E_1 -> '5' '6' '5' '9' [0.3333]
        E_1 -> '1' '8' '6' '6' [0.3333]
        E_1 -> '1' '5' '1' '5' [0.3333]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,


    "pcfg_4_3_1_2_3_4_5_6_7_8_9_eq_len_skewed_prob_0.80": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.3333]
        B_4 -> B_3 B_3 B_3 [0.3333]
        B_4 -> B_3 B_3 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 B_2 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 B_1 B_1 [0.3333]
        B_1 -> '2' '9' '3' [0.80]
        B_1 -> '9' '6' '1' [0.10]
        B_1 -> '1' '8' '6' [0.10]
        E_4 -> E_3 [0.3333]
        E_4 -> E_3 E_3 [0.3333]
        E_4 -> E_3 E_3 E_3 [0.3333]
        E_3 -> E_2 [0.3333]
        E_3 -> E_2 E_2 [0.3333]
        E_3 -> E_2 [0.3333]
        E_2 -> E_1 E_1 [0.3333]
        E_2 -> E_1 [0.3333]
        E_2 -> E_1 E_1 E_1 [0.3333]
        E_1 -> '5' '6' '5' '9' [0.80]
        E_1 -> '1' '8' '6' '6' [0.10]
        E_1 -> '1' '5' '1' '5' [0.10]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,

    "pcfg_4_3_1_2_3_4_5_6_7_8_9_eq_len_skewed_prob": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.3333]
        B_4 -> B_3 B_3 B_3 [0.3333]
        B_4 -> B_3 B_3 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 [0.3333]
        B_3 -> B_2 B_2 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 [0.3333]
        B_2 -> B_1 B_1 B_1 [0.3333]
        B_1 -> '2' '9' '3' [0.95]
        B_1 -> '9' '6' '1' [0.025]
        B_1 -> '1' '8' '6' [0.025]
        E_4 -> E_3 [0.3333]
        E_4 -> E_3 E_3 [0.3333]
        E_4 -> E_3 E_3 E_3 [0.3333]
        E_3 -> E_2 [0.3333]
        E_3 -> E_2 E_2 [0.3333]
        E_3 -> E_2 [0.3333]
        E_2 -> E_1 E_1 [0.3333]
        E_2 -> E_1 [0.3333]
        E_2 -> E_1 E_1 E_1 [0.3333]
        E_1 -> '5' '6' '5' '9' [0.95]
        E_1 -> '1' '8' '6' '6' [0.025]
        E_1 -> '1' '5' '1' '5' [0.025]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,



    "pcfg_4_3_1_2_3_4_5_6_7_8_9_eq_len_all_rules_skewed_prob": """
        S -> S_5 [1]
        S_5 -> B_4 C_1_1 E_4 T_1_1 [0.25]
        S_5 -> B_4 C_1_2 E_4 T_1_2 [0.25]
        S_5 -> B_4 C_1_3 E_4 T_1_3 [0.25]
        S_5 -> B_4 C_1_4 E_4 T_1_4 [0.25]
        B_4 -> B_3 [0.90]
        B_4 -> B_3 B_3 B_3 [0.05]
        B_4 -> B_3 B_3 [0.05]
        B_3 -> B_2 [0.90]
        B_3 -> B_2 [0.05]
        B_3 -> B_2 B_2 [0.05]
        B_2 -> B_1 [0.90]
        B_2 -> B_1 [0.05]
        B_2 -> B_1 B_1 B_1 [0.05]
        B_1 -> '2' '9' '3' [0.90]
        B_1 -> '9' '6' '1' [0.05]
        B_1 -> '1' '8' '6' [0.05]
        E_4 -> E_3 [0.90]
        E_4 -> E_3 E_3 [0.05]
        E_4 -> E_3 E_3 E_3 [0.05]
        E_3 -> E_2 [0.90]
        E_3 -> E_2 E_2 [0.05]
        E_3 -> E_2 [0.05]
        E_2 -> E_1 E_1 [0.90]
        E_2 -> E_1 [0.05]
        E_2 -> E_1 E_1 E_1 [0.05]
        E_1 -> '5' '6' '5' '9' [0.90]
        E_1 -> '1' '8' '6' '6' [0.05]
        E_1 -> '1' '5' '1' '5' [0.05]
        T_1_1 -> '1' [1]
        T_1_2 -> '2' [1]
        T_1_3 -> '3' [1]
        T_1_4 -> '4' [1]
        C_1_1 -> '5' [1]
        C_1_2 -> '6' [1]
        C_1_3 -> '7' [1]
        C_1_4 -> '8' [1]
        C_1_5 -> '9' [1]
    """,









}

grammar_details_dict = {
    "pcfg_cfg3b_disjoint_terminals": {
        "level_to_nonterminals": {
            4: [Nonterminal("A16")],
            3: [Nonterminal("A15"), Nonterminal("A14"), Nonterminal("A13")],
            2: [Nonterminal("A12"), Nonterminal("A11"), Nonterminal("A10")],
            1: [Nonterminal("A9"), Nonterminal("A8"), Nonterminal("A7")],
        },
        "nonterminal_to_level": {
            Nonterminal("S"): -100,
            Nonterminal("A16"): 4,
            Nonterminal("A15"): 3,
            Nonterminal("A14"): 3,
            Nonterminal("A13"): 3,
            Nonterminal("A12"): 2,
            Nonterminal("A11"): 2,
            Nonterminal("A10"): 2,
            Nonterminal("A9"): 1,
            Nonterminal("A8"): 1,
            Nonterminal("A7"): 1,
        }
    },

    
}

grammar_details_dict["pcfg_cfg3b_disjoint_terminals_latin"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_skewed_prob"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.55"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.60"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.70"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.80"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.90"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_all_rules_0.95"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_one_rule_different"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_two_rules_different"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_three_rules_different"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_four_rules_different"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]
grammar_details_dict["pcfg_cfg3b_disjoint_terminals_five_rules_different"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]


grammar_details_dict["pcfg_cfg3b_eq_len_skewed_prob"] = grammar_details_dict["pcfg_cfg3b_disjoint_terminals"]



def skew_distribution(probs, skewness):
    """
    Skew a probability distribution using the skew-normal distribution.

    :param probs: List of probabilities (must sum to 1)
    :param skewness: Skew factor (positive = right skew, negative = left skew, 0 = unchanged)
    :return: Skewed probability distribution
    """
    n = len(probs)  # Number of items
    if skewness == 0:
        return np.array(probs)  # No skew, return original

    x = np.linspace(-1, 1, n)  # Symmetric range
    skewed_vals = skewnorm.pdf(x, skewness)  # Generate skewed values
    skewed_probs = skewed_vals / np.sum(skewed_vals)  # Normalize to sum to 1
    return skewed_probs


def hierarchical_cfg(max_depth, 
                     max_breadth, 
                     production_per_non_terminal,
                     skewness, 
                     terminals,
                     seed=10):
    assert max_depth >= 1
    assert max_breadth >= 1
    assert production_per_non_terminal >= 1
    assert isinstance(skewness, float)
    assert isinstance(terminals, list)
    num_terminals = len(terminals)

    non_terminal_counter = 1
    non_terminal_symbol = 'A'
    productions = [] # a list of tuple: 1st entry is a non-terminal lhs, 2nd entry is a list of terminal/non-terminal rhs, and 3rd entry is the probability of the production
    depth_to_non_terminal = {}
    non_terminal_to_depth = {}

    random.seed(seed)

    for depth in range(1, max_depth+1):
        for i in range(max_breadth):
            prob_list = [1/production_per_non_terminal for _ in range(production_per_non_terminal)]
            prob_list = skew_distribution(prob_list, skewness)
            prob_list = [round(prob, 4) for prob in prob_list]
            for j in range(production_per_non_terminal):
                lhs = f"{non_terminal_symbol}_{non_terminal_counter}"
                if depth == 1:
                    rhs = random.choices(terminals, k=random.randint(1, max_breadth))
                    rhs = [f"'{terminal}'" for terminal in rhs]
                else:
                    rhs = random.choices(depth_to_non_terminal[depth-1], k=random.randint(1, max_breadth))
                
                productions.append(
                    (lhs, rhs, prob_list[j])
                )
            if depth not in depth_to_non_terminal:
                depth_to_non_terminal[depth] = []
            depth_to_non_terminal[depth].append(f"{non_terminal_symbol}_{non_terminal_counter}")
            non_terminal_to_depth[f"{non_terminal_symbol}_{non_terminal_counter}"] = depth
            if depth != max_depth:
                non_terminal_counter += 1
            else:
                break

    # starting production rule
    productions.insert(
        0, 
        ("S", [f"{non_terminal_symbol}_{non_terminal_counter}"], 1)
    )
            

    grammar = f"{productions[0][0]} -> {' '.join(productions[0][1])} [{productions[0][2]}]\n"
    for production in productions[::-1][:-1]:
        grammar += f"{production[0]} -> {' '.join(production[1])} [{production[2]}]\n"


    return grammar




def hierarchical_hcfg_double_branch(depth, 
                                    breadth,
                                    production_per_non_terminal, 
                                    skewness, 
                                    terminals=["1", "2", "3", "4"], 
                                    seed=10):

    assert isinstance(depth, int)
    assert isinstance(breadth, int)
    assert depth > 0
    assert breadth > 0
    assert production_per_non_terminal > 0
    assert len(terminals) > 2
    assert isinstance(skewness, float)

    # print(f"Depth: {depth}, Breadth: {breadth}, Terminals: {terminals}")
    

    random.seed(seed)
    num_terminals = len(terminals)
    terminal_t_list = terminals[:num_terminals//2]
    terminal_c_list = terminals[num_terminals//2:]
    
    # separator between two hierarchical grammar rules
    terminal_t_rules = []   
    terminal_c_rules = []
    for i, terminal in enumerate(terminal_t_list):
        terminal_t_rules.append(f"T_1_{i+1} -> '{terminal}' [1]")
    for i, terminal in enumerate(terminal_c_list):
        terminal_c_rules.append(f"C_1_{i+1} -> '{terminal}' [1]")
    

    u_dict = {
        "b" : [],
        "e" : []
    }

    for i in range(breadth*2):
        length = random.randint(1, breadth*2-1)
        s = random.choices(terminals, k=length)
        u_dict["b"].append(s + random.choices(terminal_t_list, k=1))
        u_dict["e"].append(s + random.choices(terminal_c_list, k=1))
    
    
    def recursive_grammar_builder(depth, type, breadth, production_per_non_terminal):
        assert type in ["b", "e"]
        assert production_per_non_terminal >= 1
        non_terminal = f"B_{depth}" if type == "b" else f"E_{depth}"
        
        prob_list = [1/production_per_non_terminal for _ in range(production_per_non_terminal)]
        prob_list = skew_distribution(prob_list, skewness)
        prob_list = [round(prob, 4) for prob in prob_list]
        

        if depth == 0:
            return []
        elif depth == 1:
            rules = []
            for i, s in enumerate(random.choices(u_dict[type], k=production_per_non_terminal)):
                s = " ".join(f"'{terminal}'" for terminal in s)
                rules.append(f"{non_terminal} -> {s} [{prob_list[i]}]")
            return rules
        else:
            
            non_terminals_child = [f"B_{depth-1}" if type == "b" else f"E_{depth-1}" for i in range(breadth)]
            rules = []
            for i in range(production_per_non_terminal):
                rules.append(f"{non_terminal} -> {' '.join(random.choices(non_terminals_child, k=random.randint(1, breadth)))} [{prob_list[i]}]")
            rules.extend(recursive_grammar_builder(depth-1, type, breadth, production_per_non_terminal))
            return rules



    start_rule = [
        f"S -> S_{depth+1} [1]",
    ]

    for i in range(num_terminals//2):
        start_rule.append(f"S_{depth+1} -> B_{depth} C_1_{i+1} E_{depth} T_1_{i+1} [{round(1/(num_terminals//2), 4)}]")

    rule_builder = []
    rule_builder.extend(start_rule)
    rule_builder.extend(recursive_grammar_builder(depth, "b", breadth, production_per_non_terminal))
    rule_builder.extend(recursive_grammar_builder(depth, "e", breadth, production_per_non_terminal))
    rule_builder.extend(terminal_t_rules)
    rule_builder.extend(terminal_c_rules)


    return "\n".join(rule_builder)




# print("\n".join(hierarchical_hcfg_double_branch(6, 3, 0)))










# def hierarchical_hcfg_double_branch(depth, breadth, seed=10):
#     assert isinstance(depth, int)
#     assert isinstance(breadth, int)
#     assert depth > 0
#     assert breadth > 0

#     terminal_t_list = ['1', '2']
#     terminal_c_list = ['3', '4']
#     terminal_list = terminal_t_list + terminal_c_list
#     u_dict = {
#         "b" : [],
#         "e" : []
#     }

#     random.seed(seed)
#     terminal_t_rules = []   
#     terminal_c_rules = []
#     for i, terminal in enumerate(terminal_t_list):
#         terminal_t_rules.append(f"T{i+1} -> '{terminal}' [1]")
#     for i, terminal in enumerate(terminal_c_list):
#         terminal_c_rules.append(f"C{i+1} -> '{terminal}' [1]")
    
#     for i in range(breadth*2):
#         len = random.randint(1, breadth*2-1)
#         s = random.choices(terminal_list, k=len)
#         u_dict["b"].append(s + random.choices(terminal_t_list, k=1))
#         u_dict["e"].append(s + random.choices(terminal_c_list, k=1))
    
#     # print(u_dict)
#     # print(terminal_t_rules)
#     # print(terminal_c_rules)

#     def recursive_grammar_builder(depth, type, breadth=3):
#         # print("Called with depth", depth, "type", type, "breadth", breadth)
#         assert type in ["b", "e"]
#         assert breadth >= 1 and breadth <= 3
#         non_terminal = f"B_{depth}" if type == "b" else f"E_{depth}"
#         if depth == 0:
#             return []
#         elif depth == 1:
#             rules = []
#             for i, s in enumerate(random.choices(u_dict[type], k=breadth)):
#                 s = " ".join(f"'{terminal}'" for terminal in s)
#                 rules.append(f"{non_terminal}_{i+1} -> {s} [1]")
#             return rules
#         else:
            
#             non_terminals_child = [f"B_{depth-1}_{i+1}" if type == "b" else f"E_{depth-1}_{i+1}" for i in range(breadth)]
#             rules = []
#             for i in range(breadth):
#                 # rules.append(f"{non_terminal}_{i+1} -> {' '.join(random.choices(non_terminals_child, k=random.randint(1, breadth)))} [{round(1/breadth, 4)}]")
#                 rules.append(f"{non_terminal}_{i+1} -> {' '.join(random.choices(non_terminals_child, k=random.randint(1, breadth)))} [1]")
#             rules.extend(recursive_grammar_builder(depth-1, type, breadth))
#             return rules
        
#     start_rule = [
#         f"S -> S_{depth+1} [1]",
#         f"S_{depth+1} -> S_{depth+1}_{1} T1 [0.5]",
#         f"S_{depth+1} -> S_{depth+1}_{2} T2 [0.5]",
#     ]

#     s_rule = [
#         f"S_{depth+1}_1 -> B_{depth} C1 E_{depth} [1]",
#         f"S_{depth+1}_2 -> B_{depth} C2 E_{depth} [1]",
#     ]
    
#     b_rule = [f"B_{depth} -> B_{depth}_{i+1} [{round(1/breadth, 4)}]" for i in range(breadth)]
#     e_rule = [f"E_{depth} -> E_{depth}_{i+1} [{round(1/breadth, 4)}]" for i in range(breadth)]

#     # print("Start Rule:")
#     # print(start_rule)

#     # print("G Rule:")
#     # print(g_rule)


#     # print()
#     # print(list(recursive_grammar_builder(depth, "b")))
#     # print()
#     # print(recursive_grammar_builder(depth, "e"))

#     rule_builder = []
#     rule_builder.extend(start_rule)
#     rule_builder.extend(s_rule)
#     rule_builder.extend(b_rule)
#     rule_builder.extend(e_rule)
#     rule_builder.extend(recursive_grammar_builder(depth, "b"))
#     rule_builder.extend(recursive_grammar_builder(depth, "e"))
#     rule_builder.extend(terminal_t_rules)
#     rule_builder.extend(terminal_c_rules)

#     # print(rule_builder)

#     return "\n".join(rule_builder)




# # print("\n".join(hierarchical_hcfg_double_branch(6, 3, 0)))



