from datasets import load_dataset
import pandas as pd
import random

# dataset = load_dataset("Elliott/Openr1-Math-46k-8192", split="train")
# with open("/fs-computility/prime/wangfuting/rl/LUFFY/data/l1/train_8k_exact.parquet", "r") as f:
dataset = pd.read_parquet("/mnt/shared-storage-user/p1-shared/wangfuting/codes/rl/LUFFY/data/l1/train_8k_exact.parquet")
# print(dataset[0])
# breakpoint()
prompts = []
for i in range(len(dataset)):
    current_prompt = dataset.iloc[i]['prompt']
    # random_number = random.randint(100, 8192)
    # breakpoint()
    
    parts = current_prompt[-1]["content"].split("Let's think step by step and output the final answer within \\boxed{}.")
    current_prompt = [{'content': 'Your task is to follow a systematic, thorough reasoning process before providing the final solution. This involves analyzing, summarizing, exploring, reassessing, and refining your thought process through multiple iterations. Structure your response into two sections: Thought and Solution. In the Thought section, present your reasoning using the format: "<think>\n {thoughts} </think>\n". Each thought should include detailed analysis, brainstorming, verification, and refinement of ideas. After "</think>\n," in the Solution section, provide the final, logical, and accurate answer, clearly derived from the exploration in the Thought section. If applicable, include the answer in \\boxed{} for closed-form results like multiple choices or mathematical solutions.' + parts[-1], 'role': 'system'}, {'content': parts[0].strip(), 'role': 'user'}] #" Let's think step by step and output the final answer within \\boxed{}."
    # instruction = "Let's think step by step and output the final answer within \\boxed{}."
    # instruction = f" {instruction} Think for {random_number} tokens."
    # item["prompt"][1]['content'] += instruction
    # item["reward_model"]["num_tokens"] =  random_number
    # item["prompt"] = [item["prompt"][-1]]
    # print( item["prompt"][0]['content'])
    prompts.append(current_prompt)
    # ret_dict.append(item)
dataset['prompt'] = prompts
print(dataset.iloc[0]['prompt'])
dataset.to_parquet("l1/train_8k_exact_luffy_style.parquet")

# val_df = pd.read_parquet("../data/valid.parquet")
# # 遍历每一行
# # 使用位置索引而不是标签索引
# for i in range(len(val_df)):
#     row = val_df.iloc[i]
#     print(f"Processing row: {i}")
    
#     current_prompt = row['prompt'].copy()
#     current_prompt[0]['content'] = """Your task is to provide a systematic reasoning approach for the given problem. Structure your response using the format: \"<guidance>\n {your guidance} </guidance>\n\". Focus on outlining the key analytical steps and overall methodology needed to solve the problem systematically."""
#     val_df.iloc[i, val_df.columns.get_loc('prompt')] = current_prompt
        
    
#     # 将修改后的整个结构赋值回去
    
# val_df.to_parquet("../data/valid_new.parquet")
# # breakpoint()