using Convex
#using SCS
using Random
using LinearAlgebra
# using Flux
using Zygote
using BenchmarkTools
using JuMP
using MathOptInterface
using Clarabel

# Clarabel optimizer factory handed to `solve!` inside get_x_watson. The "verbose" => 0
# attribute is presumably meant to silence Clarabel's own log output -- TODO confirm.
optimizer = Convex.MOI.OptimizerWithAttributes(Clarabel.Optimizer, "verbose" => 0)
# Set random seed for reproducibility.
# NOTE: the seed is set once, when the file is loaded, so every later call to run()
# continues the same random stream and draws a different initial u.
Random.seed!(0)

# Constants
# Declared `const` so that functions reading them see a binding of fixed type instead of an
# untyped global. In the code visible in this file only MAX_OUTER_EPOCHS is read (by run());
# the remaining values are kept unchanged for any code that may rely on them.
const epsilon = 1e-4
const beta = 0.1
const eta_s = 0.1
const eta_l = 1.1
const slope_epsilon = 1e-1
const MAX_INNER_EPOCHS = 10^4
const MAX_OUTER_EPOCHS = 10^3

# Objective function: the linear form 2*x[1] + 4*x[2] + x[3].
# Only the first three entries of x are read.
function f(x)
    first_entry, second_entry, third_entry = x[1], x[2], x[3]
    return 2 * first_entry + 4 * second_entry + third_entry
end


# Inner minimization using Convex.jl.
#
# Minimizes f over a 3-vector x subject to g_u(x, u, j) <= 0 for every row j of u and the
# box -1e-5 <= x <= 1, and returns the solved x as a plain vector.
function get_x_watson(u)
    x_var = Variable(3)
    # Same linear objective as f, built on the Convex variable so the two cannot drift apart.
    objective = f(x_var)

    bounds = [x_var <= 1., -x_var <= 1e-5]
    constraints = empty(bounds)
    for j in axes(u, 1)
        g = g_u(x_var, u, j)
        # When u[j, 1] <= 0 every term of g_u is switched off and it returns the plain
        # number -0.5 instead of a Convex expression. `g <= 0.` would then be a Bool rather
        # than a constraint; the row is trivially satisfied, so it is skipped.
        g isa Number && continue
        push!(constraints, g <= 0.)
    end
    # Keep the original ordering: row constraints first, then the bounds on x.
    append!(constraints, bounds)

    problem = minimize(objective, constraints)
    solve!(problem, optimizer)

    return vec(evaluate(x_var))
end
# The solver call is opaque to Zygote; mark it as having no gradient.
Zygote.@nograd get_x_watson

# Constraint function for the barrier method.
#
# Evaluates the j-th constraint at x, parameterised by row j of t: the sum of up to three
# terms of the form (1 - x[k]) * weight(t[j, :]), minus 0.5. A term is replaced by 0 when
# its denominator (t[j,1] for the first two, t[j,1] - 2 for the third) is not positive.
function g_u(x, t, j)
    # First term
    first_term = if t[j,1] > 0
        (1 - x[1]) * ((1 / t[j,1]) *
            exp(-1 * (1 + (t[j,2] - 1)^2) / t[j,1]))
    else
        0
    end

    # Second term
    second_term = if t[j,1] > 0
        (1 - x[2]) * ((1 / t[j,1]) *
            exp(-1 * (8 + t[j,2]^2) / (4 * t[j,1])))
    else
        0
    end

    # Third term
    third_term = if t[j,1] > 2
        (1 - x[3]) * ((1 / (t[j,1] - 2)) *
            exp(-1 * (1 + (t[j,2] + 1)^2) / (t[j,1] - 2)))
    else
        0
    end

    # Accumulate from a Float64 zero, in the order first, second, third.
    total = 0.0
    total += first_term
    total += second_term
    total += third_term

    # Subtract 0.5 as per the constraint
    return total - 0.5
end

# Logarithm with its argument floored at 1e-10, so non-positive inputs give log(1e-10)
# instead of raising a domain error.
function safe_log(x)
    floored = max(x, 1e-10)
    return log(floored)
end

# Log-barrier objective: alpha * f(x) minus the sum over rows j of t of
# safe_log(-g_u(x, t, j)).
function barrier(x, t, alpha)
    slacks = [-g_u(x, t, row) for row in 1:size(t, 1)]
    log_terms = safe_log.(slacks)
    return alpha * f(x) - sum(log_terms)
end


# Barrier weight alpha at the point x_ for parameters u_:
#
#     alpha = (1 / df/dx[1]) * sum_i (dg_i/dx[1]) / g_i,   g_i = g_u(x_, u_, i),
#
# i.e. the value that makes the first component of the x-gradient of `barrier` vanish.
function find_alpha(x_, u_)
    gradient_x_f = Zygote.gradient(f, x_)[1][1]
    result = 0.0
    for i in axes(u_, 1)
        # Differentiate with respect to x only; the gradients with respect to u_ and i
        # were computed and discarded before.
        grad_x = Zygote.gradient(x -> g_u(x, u_, i), x_)[1]
        # Zygote returns `nothing` when the output does not depend on x, which happens for
        # a row with u_[i, 1] <= 0 (every term of g_u is switched off). Such a row
        # contributes zero; indexing `nothing` would throw.
        grad_x === nothing && continue
        result += grad_x[1] / g_u(x_, u_, i)
    end

    return (1 / gradient_x_f) * result
end

# Inner minimization function.
#
# Solves the inner problem for the given u, derives the matching barrier weight, prints the
# objective value and minimizer, and returns (gradient of barrier w.r.t. u, alpha).
function inner_min(u)
    x_opt = get_x_watson(copy(u))
    alpha = find_alpha(copy(x_opt), copy(u))

    # The barrier is differentiated with respect to (x, u, alpha); only the u-part is kept.
    _, grad_wrt_u, _ = Zygote.gradient(barrier, x_opt, u, alpha)

    println("f(y_min) = ", f(x_opt))
    println("x = ", x_opt)
    return grad_wrt_u, alpha
end


# Outer loop of the optimization.
#
# Starting from a random 30x2 matrix u, repeatedly solves the inner problem, steps u along
# the barrier gradient scaled by 1/alpha, and clamps every entry of u to [-1, 4]. Stops
# early once the norm of the unscaled gradient falls below 1e-3, otherwise after
# MAX_OUTER_EPOCHS iterations. Progress is printed; nothing is returned.
function run()
    u = rand(30, 2)  # Random initial u
    clip_valueL = -1.0
    clip_valueU = 4.0
    lr_u = 1e-1  # Outer learning rate (constant across epochs)

    for _ in 1:MAX_OUTER_EPOCHS
        grad_u, alpha = inner_min(u)

        u .= u .+ lr_u .* grad_u / alpha
        u .= clamp.(u, clip_valueL, clip_valueU)
        println("Grad u: ", grad_u / alpha)

        # `norm` comes from LinearAlgebra; for a matrix it is the Frobenius norm.
        if norm(grad_u) < 1e-3
            println("Final u: ", u, "Grad u: ", grad_u)
            break
        end
    end
    return nothing
end

# Execute the optimization under BenchmarkTools: @benchmark invokes run() repeatedly and
# collects timing statistics, which are stored in t0 and printed.
t0 = @benchmark run()
println(t0)
# Alternative: a single un-timed execution.
# run()