from datasets import load_dataset
import pandas as pd
import random
from collections import Counter

# dataset = load_dataset("Elliott/Openr1-Math-46k-8192", split="train")
# with open("/fs-computility/prime/wangfuting/rl/LUFFY/data/l1/train_8k_exact.parquet", "r") as f:
dataset =load_dataset("/mnt/shared-storage-user/p1-shared/wangfuting/shared/data/datasets--zwhe99--DeepMath-103K", split="train")


easy = dataset.filter(lambda x: x['difficulty'] <= 5.0)      # ~30,586条 (29.7%)
medium = dataset.filter(lambda x: 5.0 < x['difficulty'] <= 6.5)  # ~39,044条 (37.9%)
hard = dataset.filter(lambda x: x['difficulty'] > 6.5)       # ~33,392条 (32.4%)



system_prompt = 'Your task is to follow a systematic, thorough reasoning process before providing the final solution. This involves analyzing, summarizing, exploring, reassessing, and refining your thought process through multiple iterations. Structure your response into two sections: Thought and Solution. In the Thought section, present your reasoning using the format: "<think>\n {thoughts} </think>\n". Each thought should include detailed analysis, brainstorming, verification, and refinement of ideas. After "</think>\n," in the Solution section, provide the final, logical, and accurate answer, clearly derived from the exploration in the Thought section. If applicable, include the answer in \\boxed{} for closed-form results like multiple choices or mathematical solutions.'


def process_split(data):
    results = []
    for i, item in enumerate(data):
        random_number = random.randint(100, 8192)
        saved_data = {
            "data_source": "",
            "prompt": [
                {"role": 'system', 'content': system_prompt + f" Think for {random_number} tokens."},
                { "role": "user", "content": item["question"]}
                ],
            "ability": "math",
            "reward_model": {
                "style": "rule",
                "ground_truth": item["final_answer"],
                "num_tokens": random_number
               
            },
            "extra_info": {
                'split': '',
                'index': i,
                'difficulty': item['difficulty']
            }
        }
        results.append(saved_data)
    train_df = pd.DataFrame(results)
    return train_df


        
        
easy_df = process_split(easy)
print("Easy:", len(easy))
print(easy_df.iloc[0]['prompt'])
easy_df.to_parquet("deepmath/easy_0-5.parquet")

medium_df = process_split(medium)
print("Medium:", len(medium_df))
print(medium_df.iloc[0]['prompt'])
medium_df.to_parquet("deepmath/medium_5-6.5.parquet")

hard_df = process_split(easy)
print("Hard:", len(hard_df))
print(hard_df.iloc[0]['prompt'])
hard_df.to_parquet("deepmath/hard_6.5-10.parquet")