import math

# def compute_score(is_correct, response_len, correct_proportion, min_correct_length, max_correct_length, alpha = 0.5):
#     L_expect = (2*correct_proportion - correct_proportion**2) * min_correct_length + (1 - correct_proportion)**2 * max_correct_length
#
#     # 设置σ参数（使用比例法）
#     k = 2.0  # 可调参数
#     sigma = L_expect / k
#
#     # 计算长度奖励（0-1范围）
#     length_penalty = (response_len - L_expect) ** 2
#     length_reward = math.exp(-length_penalty / (2 * sigma ** 2))  # 自动在(0,1]内
#
#     return is_correct+ alpha*length_reward

def compute_score(is_correct, response_len, correct_proportion, min_correct_length, max_correct_length, alpha = 0.01):
    L_expect = correct_proportion**2 * min_correct_length + (1 - correct_proportion**2) * max_correct_length
    # 设置σ参数（使用比例法）
    k = 3.0  # 可调参数
    sigma = L_expect / k

    # 计算长度奖励（0-1范围）
    length_penalty = (response_len - L_expect) ** 2
    length_reward = math.exp(-length_penalty / (2 * sigma ** 2))  # 自动在(0,1]内

    return is_correct+ alpha*correct_proportion*length_reward, is_correct, alpha*correct_proportion*length_reward