import pandas as pd

data_path = "/mnt/shared-storage-user/p1-shared/wangfuting/codes/rl/LUFFY/data/openr1_our_style.parquet"
output_path = "/mnt/shared-storage-user/p1-shared/wangfuting/codes/rl/LUFFY/data/l1/openr1_our_style_add_1k.parquet"


def add_num_tokens(data, extra_tokens=1000):
    """Increase ``reward_model['num_tokens']`` in every row of *data*.

    The ``reward_model`` column is replaced in place. Each row's mapping is
    copied before it is modified, so the objects originally stored in the
    frame are left untouched.

    Args:
        data: DataFrame with a ``reward_model`` column whose values support
            ``.copy()`` and item access by the key ``'num_tokens'``.
        extra_tokens: Amount added to each ``num_tokens`` value.

    Raises:
        KeyError: If the column or the ``'num_tokens'`` key is missing.
    """
    updated = []
    for position, reward_model in enumerate(data['reward_model']):
        print(f"Processing row: {position}")

        new_reward_model = reward_model.copy()
        new_reward_model['num_tokens'] = new_reward_model['num_tokens'] + extra_tokens
        updated.append(new_reward_model)

    # Assign the whole column at once, aligned on the frame's own index.
    # Writing row by row with ``data.at[i, ...]`` is label-based and only
    # matches the positional read when the index is a default RangeIndex;
    # with any other index it would hit the wrong row or append a new one.
    data['reward_model'] = pd.Series(updated, index=data.index, dtype=object)


if __name__ == "__main__":
    data = pd.read_parquet(data_path)
    add_num_tokens(data)
    data.to_parquet(output_path)