# moral_hazard.py  (revised)
import torch
from torch import Tensor
from typing import Dict, Tuple, Union, Optional

# Scalar type of the values stored in the `setting_parameters` dicts
# accepted by the closed-form helpers in this module.
Number = Union[float, int]

def _pick_sb(t: Tensor, s_index: int, b_index: int) -> Tuple[Tensor, Tensor]:
    """Extract (s, b) from arbitrary-shaped t using flat indices."""
    t_flat = t.flatten()
    if s_index >= t_flat.numel() or b_index >= t_flat.numel():
        raise IndexError(
            f"s_index={s_index} or b_index={b_index} out of bounds for t with {t_flat.numel()} elements."
        )
    return t_flat[s_index], t_flat[b_index]

def u1(
    a: Tensor,
    t: Tensor,
    *,
    r: float,
    c: float,
    sigma: float,
    s_index: int = 0,
    b_index: int = 1,
    **kwargs
) -> Tensor:
    """
    Principal's utility (LQ):
        u1(a,t) = a - 0.5 * r * b^2 * sigma^2 - 0.5 * c * a^2

    `b` is read from the flattened `t` at `b_index`; the `s` entry is fetched
    alongside it but not used. The scalars `r`, `c` and `sigma` are converted
    to tensors on the device and with the dtype of `a`. Any extra keyword
    arguments are accepted and ignored.

    Returns a 0-dim tensor: the expression itself when it is already 0-dim,
    otherwise the sum over all of its elements.
    """
    b = _pick_sb(t, s_index=s_index, b_index=b_index)[1]

    # Build the scalar coefficients so they match `a`.
    like_a = {"device": a.device, "dtype": a.dtype}
    r_coef = torch.as_tensor(r, **like_a)
    c_coef = torch.as_tensor(c, **like_a)
    sigma_coef = torch.as_tensor(sigma, **like_a)

    noise_term = 0.5 * r_coef * (b**2) * (sigma_coef**2)
    quadratic_term = 0.5 * c_coef * (a**2)
    total = a - noise_term - quadratic_term

    if total.ndim == 0:
        return total
    return total.sum()

def u2(
    a: Tensor,
    t: Tensor,
    *,
    r: float,
    c: float,
    sigma: float,
    s_index: int = 0,
    b_index: int = 1,
    **kwargs
) -> Tensor:
    """
    Agent's utility (LQ):
        u2(a,t) = s + b a - 0.5 * r * b^2 * sigma^2 - 0.5 * c * a^2

    `s` and `b` are read from the flattened `t` at `s_index` and `b_index`.
    The scalars `r`, `c` and `sigma` are converted to tensors on the device
    and with the dtype of `a`. Any extra keyword arguments are accepted and
    ignored.

    Returns a 0-dim tensor: the expression itself when it is already 0-dim,
    otherwise the sum over all of its elements.
    """
    s, b = _pick_sb(t, s_index=s_index, b_index=b_index)

    # Build the scalar coefficients so they match `a`.
    like_a = {"device": a.device, "dtype": a.dtype}
    r_coef = torch.as_tensor(r, **like_a)
    c_coef = torch.as_tensor(c, **like_a)
    sigma_coef = torch.as_tensor(sigma, **like_a)

    linear_part = s + b * a
    noise_term = 0.5 * r_coef * (b**2) * (sigma_coef**2)
    quadratic_term = 0.5 * c_coef * (a**2)
    total = linear_part - noise_term - quadratic_term

    if total.ndim == 0:
        return total
    return total.sum()

# -------- closed-form targets --------

def get_theoretical_optimum(
    t: Optional[torch.Tensor] = None,
    setting_parameters: Optional[Dict[str, Union[float, int]]] = None,
) -> Tuple[Union[float, torch.Tensor], Union[float, torch.Tensor], Union[float, torch.Tensor]]:
    """
    Closed-form optimum for the quadratic principal–agent model:

        u2(a,t) = s + b*a - 0.5 * r * b^2 * sigma^2 - 0.5 * c * a^2
        u1(a,t) = a         - 0.5 * r * b^2 * sigma^2 - 0.5 * c * a^2

    The values returned are

        b* = 1 / (1 + r * c * sigma^2)
        a* = b* / c
        s* = U_res - (b* a* - 0.5 * r * b*^2 * sigma^2 - 0.5 * c * a*^2)

    so that participation binds: u2(a*, t*) = U_res.

    Args:
        t: Optional tensor used only as a device/dtype template. Its values
            are never read.
        setting_parameters: Mapping with the keys "r", "c", "sigma" and
            "U_res". Each value is converted with `float(...)`.

    Returns:
        (a_star, b_star, s_star). Plain Python floats when `t` is not a
        tensor; otherwise 0-dim tensors on the device and with the dtype
        of `t`.

    Raises:
        ValueError: if `setting_parameters` is None, if any of r, c, sigma is
            NaN or infinite, if c <= 0, if sigma < 0, or if r < 0.
        KeyError: if a required key is missing from `setting_parameters`.
    """
    import math  # function-scope import keeps this block self-contained

    if setting_parameters is None:
        raise ValueError("`setting_parameters` dict must be provided.")

    r = float(setting_parameters["r"])
    c = float(setting_parameters["c"])
    sigma = float(setting_parameters["sigma"])
    U_res = float(setting_parameters["U_res"])

    # NaN compares False against everything, so it would slip through the
    # range checks below; infinities can turn r * c * sigma^2 into NaN
    # (inf * 0). Reject both explicitly instead of returning a bogus optimum.
    for name, value in (("r", r), ("c", c), ("sigma", sigma)):
        if not math.isfinite(value):
            raise ValueError(f"Parameter `{name}` must be finite.")

    if c <= 0:
        raise ValueError("Parameter `c` must be > 0.")
    if sigma < 0:
        raise ValueError("Parameter `sigma` must be >= 0.")
    if r < 0:
        raise ValueError("Parameter `r` must be >= 0.")

    # With r >= 0, c > 0 and sigma >= 0 all finite, denom is always >= 1,
    # so no clamping against zero is needed.
    denom = 1.0 + r * c * (sigma ** 2)

    b_star = 1.0 / denom
    a_star = b_star / c
    # Fixed transfer that makes the agent's utility equal U_res at (a*, b*).
    s_star = U_res - (b_star * a_star - 0.5 * r * (b_star ** 2) * (sigma ** 2) - 0.5 * c * (a_star ** 2))

    if isinstance(t, torch.Tensor):
        device, dtype = t.device, t.dtype
        a_star = torch.as_tensor(a_star, device=device, dtype=dtype)
        b_star = torch.as_tensor(b_star, device=device, dtype=dtype)
        s_star = torch.as_tensor(s_star, device=device, dtype=dtype)

    return a_star, b_star, s_star


def u1_min_at_optimum(
    t: Optional[torch.Tensor] = None,
    setting_parameters: Dict[str, Number] = None,
) -> Union[float, torch.Tensor]:
    """
    Evaluate a - 0.5 * r * b^2 * sigma^2 - 0.5 * c * a^2 at the (a*, b*)
    returned by `get_theoretical_optimum`.

    `t` and `setting_parameters` are forwarded unchanged to
    `get_theoretical_optimum`. The result is a tensor when that function
    returned tensors, and a plain float otherwise.
    """
    a_opt, b_opt, _ = get_theoretical_optimum(t=t, setting_parameters=setting_parameters)

    r, c, sigma = (float(setting_parameters[key]) for key in ("r", "c", "sigma"))

    # Plain-float path: the optimum was not converted to tensors.
    if not isinstance(a_opt, torch.Tensor):
        return a_opt - 0.5 * r * (b_opt ** 2) * (sigma ** 2) - 0.5 * c * (a_opt ** 2)

    # Tensor path: lift the scalars to a_opt's device/dtype before combining.
    like_a = {"device": a_opt.device, "dtype": a_opt.dtype}
    r_coef = torch.as_tensor(r, **like_a)
    c_coef = torch.as_tensor(c, **like_a)
    sigma_coef = torch.as_tensor(sigma, **like_a)

    noise_term = 0.5 * r_coef * (b_opt ** 2) * (sigma_coef ** 2)
    quadratic_term = 0.5 * c_coef * (a_opt ** 2)
    return a_opt - noise_term - quadratic_term