import gurobipy as gp
import numpy as np
from gurobipy import GRB


def compute_credits(agent_num, coalition_set, advantage, advantage_grand):
    batch_size = advantage.shape[1]
    solutions = []

    coalition_set = [list(coalition) for coalition in coalition_set]

    model = gp.Model()
    model.setParam('OutputFlag', 0)
    model.setParam('Threads', 1)
    model.setParam('Presolve', 2)
    model.setParam('Method', 1)
    model.setParam('OptimalityTol', 1e-9)
    model.setParam('FeasibilityTol', 1e-9)
    model.setParam('NumericFocus', 1)
    model.setParam('LogToConsole', 0)
    model.setParam('LogFile', '')

    eps = model.addVar(lb=0, vtype=GRB.CONTINUOUS, name="eps")
    x = model.addVars(range(agent_num), lb=-GRB.INFINITY, vtype=GRB.CONTINUOUS, name="x")
    y = model.addVars(range(agent_num), lb=0, vtype=GRB.CONTINUOUS, name="y")

    avg_x = gp.quicksum(x[i] for i in range(agent_num)) / agent_num
    obj = eps + 1e-4 * gp.quicksum(y[i] for i in range(agent_num)) / agent_num
    model.setObjective(obj, GRB.MINIMIZE)

    for i in range(agent_num):
        model.addConstr(x[i] - avg_x <= y[i], name=f"y_pos_{i}")
        model.addConstr(-(x[i] - avg_x) <= y[i], name=f"y_neg_{i}")

    constr = model.addConstrs(
        (gp.quicksum(x[i] for i in coalition_set[j]) + eps >= 0 for j in range(len(coalition_set))),
        name="c"
    )
    constr_grand = model.addConstr(gp.quicksum(x[i] for i in range(agent_num)) == 0, name="c_grand")

    model.update()

    if not isinstance(advantage, np.ndarray):
        advantage = np.array(advantage)
    if not isinstance(advantage_grand, np.ndarray):
        advantage_grand = np.array(advantage_grand)

    for b in range(batch_size):
        current_advantage = advantage[:, b]
        current_grand = advantage_grand[b]
        for j in range(len(coalition_set)):
            constr[j].RHS = current_advantage[j]
        constr_grand.RHS = current_grand

        if b > 0:
            last_solution = solutions[-1][:-1]
            mean_last = np.mean(last_solution)
            for i in range(agent_num):
                x[i].Start = last_solution[i]
                y[i].Start = abs(last_solution[i] - mean_last)
            eps.Start = solutions[-1][-1]

        model.optimize()

        if model.status == GRB.OPTIMAL:
            solution = [x[i].X for i in range(agent_num)] + [eps.X]
        else:
            solution = [0.0] * (agent_num + 1)

        solutions.append(solution)

    model.dispose()
    return np.array(solutions)
