import numpy as np
import torch


class AbsoluteLengthDifference:
    """Reward text whose character length is close to the target's length.

    This is a demonstration metric: it only compares string lengths and says
    nothing about the correctness or quality of the generated text. Replace
    it with a task-specific metric for real use.

    The raw reward is ``-|len(generated) - len(target)|``, so it is always
    ``<= 0`` and equals ``0`` only when the lengths match. The normalized
    reward rescales the raw reward linearly from ``[min_val, max_val]`` onto
    ``[0, 1]``. No clamping is applied: raw rewards below ``min_val`` produce
    negative normalized values, and with the default ``max_val`` of 1 the
    best achievable normalized reward is ``2000 / 2001`` rather than 1.
    """

    def __init__(self, min_val: float = -2000, max_val: float = 1):
        """Configure the range used to normalize rewards.

        Args:
            min_val: Raw reward that maps to a normalized reward of 0.
            max_val: Raw reward that maps to a normalized reward of 1.

        Raises:
            ValueError: If ``max_val`` equals ``min_val``, which would make
                the normalization divide by zero.
        """
        if max_val == min_val:
            raise ValueError(
                "max_val and min_val must differ to normalize rewards"
            )
        self.min_val = min_val
        self.max_val = max_val

    def __call__(self, generated_text, target_text):
        """Compute raw and normalized length-difference rewards.

        Args:
            generated_text: A string, or an array-like of strings, to score.
            target_text: The reference string(s). Must be broadcastable
                against ``generated_text`` under NumPy's rules.

        Returns:
            A ``(rewards, norm_rewards)`` pair of ``float32`` tensors:
            ``rewards`` is the negative absolute length difference and
            ``norm_rewards`` is ``(rewards - min_val) / (max_val - min_val)``.
        """
        # np.char.str_len is vectorized, so a single string and a batch of
        # strings go through the same code path.
        length_difference = np.char.str_len(generated_text) - np.char.str_len(
            target_text
        )
        rewards = -torch.abs(torch.tensor(length_difference, dtype=torch.float32))
        norm_rewards = (rewards - self.min_val) / (self.max_val - self.min_val)
        return rewards, norm_rewards
