import os
import json
import numpy as np

TAMPERING_HOME = os.getenv("TAMPERING_HOME")

model_code = "sarm-llama" # skywork-llama, sarm-llama, qrm-gemma, urm-llama
rewards_path = f"{TAMPERING_HOME}/datasets/hhrlhf/rm/test/hhrlhf_RM_1000_reward_{model_code}.json"

with open(rewards_path, "r") as f:
    rewards = json.load(f)

bias = []
unbiased = []
bias_win = 0
tie = 0
unbiased_win = 0

for item in rewards:
    unbiased.append(item["reward_1"])
    bias.append(item["reward_2"])
    if item["reward_2"] > item["reward_1"]:
        bias_win += 1
    elif item["reward_2"] == item["reward_1"]:
        tie += 1
    else:
        unbiased_win += 1
        
bias_win /= len(rewards)
tie /= len(rewards)
unbiased_win /= len(rewards)
 
print("=" * 100)
print("Reward model: ", model_code)
print("=" * 100)
print("Reward stats")
print(f"Total mean reward: {np.mean(bias + unbiased):.2f}")
print(f"Total std reward: {np.std(bias + unbiased):.2f}")
print(f"Mean reward of bias: {np.mean(bias):.2f}")
print(f"Mean reward of unbiased: {np.mean(unbiased):.2f}")
print("=" * 100)
print("Win stats")
print(f"Number of bias win: {bias_win * 100:.2f}%")
print(f"Number of tie: {tie * 100:.2f}%")
print(f"Number of unbiased win: {unbiased_win * 100:.2f}%")
print("=" * 100)
print("Bias")
print(f"Biased win rate w/o tie: {bias_win / (bias_win + unbiased_win):.3f}")