import sys

import pandas as pd

# Load the two dataset variants that are compared row by row (by position).
data1 = pd.read_parquet("/mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/data/l1/deepscaler-add1k_8k_nov.parquet")
data2 = pd.read_parquet("/mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/data/l1/deepscaler_qwen3_polaris_add1k_new.parquet")

# A positional comparison only covers rows present in both frames. Make a
# length mismatch visible instead of crashing part-way through (data2 shorter)
# or silently ignoring the unmatched tail (data2 longer).
if len(data1) != len(data2):
    print(
        f"warning: row counts differ ({len(data1)} vs {len(data2)}); "
        "comparing only the common prefix",
        file=sys.stderr,
    )

# For every row whose reward_model['num_tokens'] differs between the two
# files, record data2's num_tokens and data2's extra_info['ori_acc'].
# The columns are extracted once and walked in lockstep, which avoids
# materialising a whole row Series through .iloc[i] several times per row.
different_list = []
acc_list = []
for reward1, reward2, extra2 in zip(
    data1['reward_model'], data2['reward_model'], data2['extra_info']
):
    if reward1['num_tokens'] != reward2['num_tokens']:
        different_list.append(reward2['num_tokens'])
        acc_list.append(extra2['ori_acc'])

# Number of rows whose num_tokens differ between the two files.
different = len(different_list)
print(different)


# Summarize the distribution of the values in different_list
from collections import Counter
import numpy as np

# Print a frequency table and summary statistics for the mismatching
# num_tokens values collected in different_list, then the mean of acc_list.
if different_list:
    num_different = len(different_list)
    counter = Counter(different_list)
    print("\n不同值的分布:")
    for value, count in sorted(counter.items()):
        print(f"  {value}: {count} 次 ({count/num_different*100:.2f}%)")

    print("\n统计信息:")
    print(f"  总数: {num_different}")
    print(f"  唯一值数量: {len(counter)}")
    # Threshold is 8192 + 500 = 8692, matching the label printed below.
    count_less_than_8692 = sum(1 for x in different_list if x < 8192 + 500)
    print(f"  小于 8192 + 500 (8692) 的个数: {count_less_than_8692} ({count_less_than_8692/num_different*100:.2f}%)")
else:
    print("\n没有不同的值")

# np.mean([]) emits a "Mean of empty slice" RuntimeWarning before returning
# nan; print nan directly in that case so the output stays the same without
# the warning.
print(np.mean(acc_list) if acc_list else float("nan"))