import json
import random
import copy
from pathlib import Path
import os
from vllm import LLM,SamplingParams
from tqdm import tqdm

prompt_template = """
You are a writing assistant skilled in various literary and rhetorical styles. 

Given the following question and its original response, rewrite the response in the specified style while preserving the original meaning.

---

Question:
{query}

Original Response:
{response}

Target Style: {style}

Now, generate a rewritten response in the {style} style.
""".strip()

def textfooler():
    pass


def styleAdv(llm,data_path,style,if_train=False):
    sampling_params = SamplingParams(temperature=1,max_tokens=1024)
    p = Path(data_path)
    filename = p.stem
    print(f"processing {filename} Style: {style} ")
    with open(data_path,'r',encoding='utf-8') as f:
        datas = json.load(f)
    random.seed(42)
    selected_samples = random.sample(datas, 128)

    styleAdv_batch = []
    if not if_train:
        for item in selected_samples:
            if item['good_response'] == "A":
                prompt = prompt_template.format(query=item['question'], response=item['response_A'], style=style)
            else:
                prompt = prompt_template.format(query=item['question'], response=item['response_B'], style=style)
            styleAdv_batch.append(prompt)
    elif if_train:
        for item in selected_samples:
            prompt = prompt_template.format(query=item['instruction'], response=item['chosen'], style=style)
            styleAdv_batch.append(prompt)
    
    new_style = []
    total = (len(styleAdv_batch) + 15) // 16
    for i in tqdm(range(0,len(styleAdv_batch),16),total=total):
        batch = styleAdv_batch[i:i+16]
        outputs = llm.generate(batch,sampling_params)
        for output in outputs:
            generated_text = output.outputs[0].text
            new_style.append(generated_text)
    
    if not if_train:
        for data, new in zip(selected_samples,new_style):
            if data['good_response'] == 'A':
                data['response_A'] = new
            elif data['good_response'] == 'B':
                data['response_B'] = new
    elif if_train:
        for data, new in zip(selected_samples,new_style):
            data['chosen'] = new
        
    save_path = f'/data/{filename}_style.json'
    with open(save_path, 'w', encoding='utf-8') as f:
        json.dump(selected_samples,f,indent=2,ensure_ascii=False)

def style_loop():
    model_path = '/path/to/model'
    os.environ['CUDA_VISIBLE_DEVICES'] = '0,1,2,3'
    llm = LLM(model=model_path,tensor_parallel_size=4)
    style_list = ['Shakespearean English', 'Biblical Prose', 'Journalistic', 'Stream of Consciousness', 'Satirical']
    data_list = [
        '/path/to/data'
    ]
    
    for data_path in data_list:
        style = random.choice(style_list)
        styleAdv(llm,data_path,style)
    style = random.choice(style_list)
    styleAdv(llm,'/path/to/train_data',style,True)



def RRM(data_path):
    p = Path(data_path)
    filename = p.stem
    with open(data_path,'r',encoding='utf-8') as f:
        datas = json.load(f)
        random.seed(42)
    
        selected_samples = random.sample(datas, 128)

        pool = datas.copy()

        rrm_samples = []
        for item in selected_samples:
            new_item = copy.deepcopy(item)
            other = random.choice([x for x in pool if x != item])
            if other["good_response"] == "B":
                alt_response = random.choice([other["response_A"], other["response_B"]])
            else:
                alt_response = other["response_A"]

            if item['good_response'] == 'A':
                new_item['response_B'] = alt_response
            elif item['good_response'] == 'B':
                new_item['response_A'] = alt_response
            else:
                continue 
            rrm_samples.append(new_item)

        save_path = f'/data/{filename}_RRM.json'
        with open(save_path, 'w', encoding='utf-8') as f:
            json.dump(rrm_samples, f, indent=2, ensure_ascii=False)

def RRM_train(data_path):
    p = Path(data_path)
    filename = p.stem
    with open(data_path,'r',encoding='utf-8') as f:
        datas = json.load(f)
        random.seed(42)
    
        selected_samples = random.sample(datas, 128)

        pool = datas.copy()

        rrm_samples = []
        for item in selected_samples:
            new_item = copy.deepcopy(item) 
            other = random.choice([x for x in pool if x != item])
            alt_response = other["chosen"]
            item['rejected'] == alt_response
            rrm_samples.append(new_item)

        save_path = f'/data/{filename}_RRM.json'

        with open(save_path, 'w', encoding='utf-8') as f:
            json.dump(rrm_samples, f, indent=2, ensure_ascii=False)

def RRM_process():
    data_list = [
        '/path/to/data'
    ]
    for path in data_list:
        RRM(path)
    RRM_train('/path/to/train_data')
    print("finished✅")

if __name__ == '__main__':
    RRM_process()
    style_loop()

