import json
import random
import pandas as pd
# Input JSON dump and output parquet locations used by this script.
INPUT_JSON = "/fs-computility/prime/wangfuting/rl/LUFFY/verl/recipe/l1/deepscaler/data/train/deepscaler.json"
OUTPUT_PARQUET = "/fs-computility/prime/wangfuting/rl/LUFFY/data/l1/train_1k_sampled.parquet"

# Number of items kept after shuffling.
SAMPLE_SIZE = 1000
# Fixed seed so the sampled subset can be regenerated exactly.
SEED = 42


def to_record(item, index):
    """Build the parquet row for one raw item.

    Args:
        item: Mapping with at least the keys ``"problem"`` and ``"answer"``.
            It is read, never modified.
        index: Position of the item inside the sampled subset; stored under
            ``extra_info["index"]``.

    Returns:
        A dict holding a two-message chat prompt (system + user question),
        the rule-style reward spec with the ground-truth answer, and the
        bookkeeping fields ``data_source``, ``ability`` and ``extra_info``.

    Raises:
        KeyError: If ``item`` lacks ``"problem"`` or ``"answer"``.
    """
    return {
        "data_source": "",
        "prompt": [
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": item["problem"]},
        ],
        "ability": "math",
        "reward_model": {
            "style": "rule",
            "ground_truth": item["answer"],
        },
        "extra_info": {
            "split": "",
            "index": index,
        },
    }


def sample_records(data, n=SAMPLE_SIZE, seed=None):
    """Shuffle ``data`` and convert the first ``n`` items into records.

    Args:
        data: Sequence of raw items (see :func:`to_record`). The sequence and
            its items are left untouched; a copy is shuffled.
        n: Maximum number of records to return. Fewer are returned when
            ``data`` holds fewer than ``n`` items.
        seed: Seed for the shuffle. ``None`` gives a different order on
            every call; any fixed value makes the result reproducible.

    Returns:
        A list of record dicts whose ``extra_info["index"]`` runs from 0
        upwards in output order.
    """
    # A private Random instance keeps the global RNG state unaffected.
    rng = random.Random(seed)
    shuffled = list(data)
    rng.shuffle(shuffled)
    # Take the first n items of the shuffled copy.
    return [to_record(item, i) for i, item in enumerate(shuffled[:n])]


def main():
    """Read the input JSON, sample ``SAMPLE_SIZE`` items, write the parquet file."""
    # JSON text is UTF-8; do not rely on the platform default encoding.
    with open(INPUT_JSON, "r", encoding="utf-8") as f:
        data = json.load(f)
    records = sample_records(data, SAMPLE_SIZE, SEED)
    pd.DataFrame(records).to_parquet(OUTPUT_PARQUET)


if __name__ == "__main__":
    main()