
import numpy as np
import random
from copy import deepcopy

class Dataset_Generator:
    def __init__(self) -> None:
        self.id = 290  
        self.name =  'word_pattern'  
        self.description = "check if the string match the pattern"  
        self.url = "https://leetcode.com/problems/word-pattern/description/"
         
        self.rule = '''
def wordPattern(pattern, string):
        # Initialize words
        slist = string.split()
        sdict = {}
        consistence = True
        # Main Loop
        while len(pattern) != 0:
            if pattern[0] not in sdict:
                if slist[0] in sdict.values():
                    consistence = False
                    break
                else:
                    sdict[pattern[0]] = slist[0]
            else:
                if sdict[pattern[0]] != slist[0]:
                    consistence = False
                    break
            # Update
            pattern = pattern[1:]
            slist.pop(0)
        return consistence'''
        self.initialize = '''
1. Initialize words and pattern
pattern = "{}"
string = "{}"
```
slist = string.split()
sdict = {{}}
consistence = True
```
slist = string.split() = {}
2. Main Loop'''
        self.one_iteration_2_1_not_in_dict_not_in_values = '''
2.1 one iteration
```
while len(pattern) != 0:
```
pattern = "{}" != 0
enter
```
if pattern[0] not in sdict:
```
pattern[0] = "{}"
sdict = {}
pattern[0] not in sdict
enter
```
if slist[0] in sdict.values():
```
slist[0] = "{}"
sdict.values() = {}
slist[0] not in sdict.values()
do not enter
```
else:
    sdict[pattern[0]] = slist[0]
```
pattern[0] = "{}"
slist[0] = "{}"
sdict[pattern[0]] = slist[0] = "{}"'''
        self.one_iteration_2_1_not_in_keys_in_values = '''
2.1 one iteration
```
while len(pattern) != 0:
```
pattern = "{}" != 0
enter
```
if pattern[0] not in sdict:
```
pattern[0] = "{}"
sdict = {}
patterns[0] not in sdict
enter
```
if slist[0] in sdict.values():
```
slist[0] = "{}"
sdict.values() = {}
slist[0] in sdict.values()
enter
```
consistence = False
break
```
consistence = False
jump out of the loop'''
        self.one_iteration_2_1_in_dict_inconsistence = '''
2.1 one iteration
```
while len(pattern) != 0:
```
pattern = "{}" != 0
enter
```
if pattern[0] not in sdict:
```
pattern[0] = "{}"
sdict = {}
pattern[0] in sdict
do not enter
```
else:
    if sdict[pattern[0]] != slist[0]:
```
pattern[0] = "{}"
slist[0] = "{}"
sdict = {}
sdict[pattern[0]] = "{}" != slist[0]
enter
```
consistence = False
break
```
jump out of the loop'''
        self.one_iteration_2_1_in_dict_consistence = '''
2.1 one iteration
```
while len(pattern) != 0:
```
pattern = "{}" != 0
enter
```
if pattern[0] not in sdict:
```
pattern[0] = "{}"
sdict = {}
patterns[0] in sdict
do not enter
```
else:
    if sdict[pattern[0]] != slist[0]:
```
pattern[0] = "{}"
slist[0] = "{}"
sdict = {}
sdict[pattern[0]] = "{}" == slist[0]
do not enter'''
        self.one_iteration_2_2_updete_variables = '''
2.2 update variables
```
pattern = pattern[1:]
slist.pop(0)
```
pattern = "{}"
slist = {}'''
        self.complete_loop = '''
3. complete loop
```
while len(pattern) != 0:
```
pattern = ""
len(pattern) = 0
do not enter'''
        self.return_result = '''
4. Return Result
```
return consistence
```
consistence = {}
So the answer is {}.'''

    def gen_data_from_len(self, length: int) -> dict:
        pattern = ''.join(random.choices(['a','b'], k=length))
        string = (''.join(random.choices([' cat', ' dog'], k=length))).strip()
        question = f'A string s is "{string}", a string pattern is "{pattern}". Checking if s can be matched to pattern such that each letter in the pattern uniquely maps to exactly one word in s and vice versa, forming a bijection between letters and words.'
        slist = string.split()
        slist_bk = slist[:]
        pattern_bk = pattern[:]
        sdict = {}
        consistence = True
        while len(pattern_bk)!=0:
            if pattern_bk[0] not in sdict:
                if slist_bk[0] not in sdict.values():
                    sdict[pattern_bk[0]] = slist_bk[0]
                else:
                    consistence = False
                    break
            else:
                if sdict[pattern_bk[0]] != slist_bk[0]:
                    consistence = False
                    break
            pattern_bk = pattern_bk[1:]
            slist_bk.pop(0)
        gt = "Yes" if consistence else "No"
        return {"question": question,
                "gt": gt,
                "string": string,
                "pattern": pattern}
        
        '''
        return datapoint of given length
        
        return {...}
        '''
            
        
    def rfft_IO(self, data: dict) -> dict:
        instruction = "Follow the given rule to solve the question.\nrule:"
        '''
        data: a datapoint from gen_data_from_len
        return rfft input-output of given data
        
        return {"input": rfft_input,
                "output": rfft_output,
                "answer": ground_truth_answer}
        '''
        rule = self.rule
        input = instruction + rule + "\n\nQ: " + data["question"]
        # rfft output
        string = data["string"]
        pattern = data["pattern"]
        consistence = True
        slist = string.split()
        sdict = {}
        output = self.initialize.format(pattern, string, slist)
        while len(pattern) != 0:
            if pattern[0] not in sdict:
                if slist[0] not in sdict.values():
                    output += self.one_iteration_2_1_not_in_dict_not_in_values.format(pattern, pattern[0], sdict, slist[0],list(sdict.values()), pattern[0], slist[0], slist[0])
                    sdict[pattern[0]] = slist[0]
                else:
                    consistence = False
                    output += self.one_iteration_2_1_not_in_keys_in_values.format(pattern, pattern[0], sdict, slist[0], list(sdict.values()))
                    break
            else:
                if sdict[pattern[0]] != slist[0]:
                    consistence = False
                    output += self.one_iteration_2_1_in_dict_inconsistence.format(pattern, pattern[0], sdict, pattern[0], slist[0], sdict, sdict[pattern[0]])
                    break
                else:
                    output += self.one_iteration_2_1_in_dict_consistence.format(pattern, pattern[0], sdict, pattern[0], slist[0], sdict, sdict[pattern[0]])
            pattern = pattern[1:]
            slist.pop(0)
            output += self.one_iteration_2_2_updete_variables.format(pattern, slist)
        if len(pattern) == 0: 
            output += self.complete_loop
        answer = "Yes" if consistence else "No"
        output += self.return_result.format(consistence, answer)
        return {"input": input,
                "output": output,
                "answer": answer}


