from datasets import load_dataset
import os

# Load the "train" split of the dataset.
ds = load_dataset("guiugiuo/numia_prompt_ppo", split="train")

# Destination Parquet file; defined once so the directory creation below
# cannot drift out of sync with the path that is actually written.
output_path = "/home/USER/PRM_filter/data/numina_math/train_numina_raw.parquet"

# Create the output file's real parent directory. Previously only
# ".../data" was created, leaving ".../data/numina_math" missing, so the
# write failed whenever that subdirectory did not already exist.
os.makedirs(os.path.dirname(output_path), exist_ok=True)

# Save to Parquet
ds.to_parquet(output_path)