using LinearAlgebra
using Random

using Convex
#using SCS
# using Flux
using Zygote
using BenchmarkTools
using JuMP
using MathOptInterface
using Clarabel

# Solver factory passed to `solve!` inside `get_x_watson`: Clarabel with its
# "verbose" option set to 0.
optimizer = Convex.MOI.OptimizerWithAttributes(Clarabel.Optimizer, "verbose" => 0)
# Set random seed for reproducibility
# NOTE(review): nothing in the visible code draws random numbers (the `rand(2)`
# start point in `run` is commented out) — confirm the seed is still needed.
Random.seed!(0)

# Constants
# Declared `const` so that functions reading them see concretely typed globals
# rather than untyped, reassignable ones. Of these, only MAX_OUTER_EPOCHS is read
# by the code visible in this file (as the outer loop bound in `run`).
const epsilon = 1e-4
const beta = 0.1
const eta_s = 0.1
const eta_l = 1.1
const slope_epsilon = 1e-1
const MAX_INNER_EPOCHS = 10^4
const MAX_OUTER_EPOCHS = 10^5

"""
    f(x)

Objective function evaluated at `x`; only `x[1]` and `x[2]` are read.

Returns `(x[1] + x[2] - 2)^2 + (x[1] - x[2])^2 + 30 * min(0, x[1] - x[2])^2`,
i.e. the last term is only active when `x[1] < x[2]`.
"""
function f(x)
    total = x[1] + x[2]
    gap = x[1] - x[2]
    # Negative part of the gap; zero whenever x[1] >= x[2].
    shortfall = min(0, gap)
    return (total - 2)^2 + gap^2 + 30 * shortfall^2
end

"""
    g_u_cvx(x_var, t, j)

Constraint expression used when building the Convex.jl problem in `get_x_watson`:
`x_var[1] * cos(t[j]) + x_var[2] * sin(t[j]) - 1.0`.

`j` selects which entry of `t` supplies the angle.
"""
function g_u_cvx(x_var, t, j)
    angle = t[j]
    lhs = x_var[1] * cos(angle) + x_var[2] * sin(angle)
    return lhs - 1.0
end

"""
    get_x_watson(u)

Inner minimization using Convex.jl.

Builds a problem over a 2-element `Variable` whose objective mirrors `f`
(`square` terms plus `30 * square(max(0, -(x1 - x2)))`), subject to
`g_u_cvx(x_var, u, j) <= -1e-5` for every `j in 1:length(u)`. The problem is
solved with the global `optimizer`, and the value of the variable after the
solve is returned via `evaluate`.
"""
function get_x_watson(u)
    x_var = Variable(2)

    # Objective terms are built separately and in the same order as they are summed.
    sum_term = square(x_var[1] + x_var[2] - 2)
    diff_term = square(x_var[1] - x_var[2])
    penalty_term = 30 * square(max(0, -(x_var[1] - x_var[2])))
    objective = sum_term + diff_term + penalty_term

    # One constraint per entry of `u`, each kept 1e-5 inside the boundary.
    constraints = map(j -> g_u_cvx(x_var, u, j) <= -1e-5, 1:length(u))

    problem = minimize(objective, constraints)
    solve!(problem, optimizer)
    return evaluate(x_var)
end

# Exclude the solver call from Zygote differentiation.
Zygote.@nograd get_x_watson

"""
    g_u(x, t, j)

Constraint function used by the barrier method and by `find_alpha`:
`x[1] * cos(t[j]) + x[2] * sin(t[j]) - 1.0`.

`j` selects which entry of `t` supplies the angle.
"""
function g_u(x, t, j)
    angle = t[j]
    lhs = x[1] * cos(angle) + x[2] * sin(angle)
    return lhs - 1.0
end

"""
    safe_log(x)

Return `log(max(x, 1e-10))`, i.e. the logarithm of `x` with its argument floored
at `1e-10`.
"""
function safe_log(x)
    floor_value = 1e-10
    clamped = max(x, floor_value)
    return log(clamped)
end

"""
    barrier(x, t, alpha)

Log-barrier objective `alpha * f(x) - sum_j log(-g_u(x, t, j))`.

The sum runs over every index of `t`, matching the constraint set built in
`get_x_watson` (one constraint per entry of `u`). For a 2-element `t` this is the
same value as summing constraints 1 and 2 explicitly.

`log` is applied to `-g_u(x, t, j)` directly, so a violated constraint
(`g_u > 0`) raises a `DomainError` rather than being clamped.
"""
function barrier(x, t, alpha)
    # Slack of each constraint; positive when the constraint is strictly satisfied.
    constraint_values = [-g_u(x, t, j) for j in eachindex(t)]
    return alpha * f(x) - sum(log.(constraint_values))
end

"""
    inner_min(u)

Solve the inner problem for the given `u` and differentiate the barrier objective.

Steps:
1. `x = get_x_watson(u)` — inner minimizer from the Convex.jl solve.
2. `alpha = find_alpha(x, u)` — barrier weight for that point.
3. `Zygote.gradient(barrier, x, u, alpha)` — gradients with respect to all three
   arguments; only the one for `u` (second entry) is returned.

Prints `f(x)` and `x` as progress output.

Returns the tuple `(alpha, grad_u)`.
"""
function inner_min(u)
    # Neither helper mutates its arguments, so no defensive copies are needed.
    x = get_x_watson(u)
    alpha = find_alpha(x, u)

    grad = Zygote.gradient(barrier, x, u, alpha)

    println("f(y_min) = ", f(x))
    println("x = ", x)

    return alpha, grad[2]
end


"""
    find_alpha(x_, u_)

Compute the barrier weight `alpha` from first components of gradients at `x_`:

    alpha = (1 / ∂f/∂x₁) * sum_i (∂g_u(x_, u_, i)/∂x₁) / g_u(x_, u_, i)

with the sum taken over every index of `u_`.

If the result is `NaN` or exceeds `1e5`, it is replaced by `1e5`. The cap is a
`Float64`, so the function returns a `Float64` on every path (the previous
integer cap made the return type depend on the value).
"""
function find_alpha(x_, u_)
    alpha_cap = 1e5

    # First component of the gradient of the objective.
    gradient_x_f = Zygote.gradient(f, x_)[1][1]

    result = 0.0
    for i in eachindex(u_)
        # First component of the gradient of constraint i with respect to x.
        grad_component = Zygote.gradient(g_u, x_, u_, i)[1][1]
        result += grad_component / g_u(x_, u_, i)
    end

    alpha_temp = (1 / gradient_x_f) * result
    if isnan(alpha_temp) || alpha_temp > alpha_cap
        alpha_temp = alpha_cap
    end

    return alpha_temp
end


"""
    run()

Main optimization loop.

Starts from `u = [0.1, 0.1]` and, for at most `MAX_OUTER_EPOCHS` iterations:
1. calls `inner_min(u)` to obtain `alpha` and the barrier gradient with respect to `u`;
2. moves `u` by `lr_u * grad_u / alpha` and clamps each entry to `[0.0, 2.0]`;
3. stops once the Euclidean distance between successive iterates is below `1e-3`,
   printing the final `u` and gradient.

Prints the scaled gradient every iteration. Returns `nothing`.

`norm` comes from the `LinearAlgebra` standard library, which must be loaded at
the top of the file.
"""
function run()
    u = [0.1, 0.1]  # fixed start point (a random `rand(2)` start was used previously)
    u_prev = copy(u)

    lr_u = 1e-1  # outer learning rate; constant across epochs
    clip_valueL = 0.0
    clip_valueU = 2.0

    for epoch in 1:MAX_OUTER_EPOCHS
        alpha, grad_u = inner_min(u)
        println("Grad u: ", grad_u / alpha)

        # Step along the alpha-scaled gradient, then project back onto the box.
        u .= u .+ lr_u .* grad_u / alpha
        u .= clamp.(u, clip_valueL, clip_valueU)

        if norm(u .- u_prev) < 1e-3
            println("Final u: ", u, "Grad u: ", grad_u)
            break
        end
        u_prev .= u
    end

    return nothing
end

# Execute the optimization
# `run()` is timed with BenchmarkTools' `@benchmark`; the resulting trial object is
# kept in `t0` and printed.
# NOTE(review): `@benchmark` normally evaluates its expression repeatedly, so the
# progress output printed inside `run()` would appear once per evaluation — confirm
# this is intended.
t0 = @benchmark run()
println(t0)

# Plain, un-timed invocation (currently disabled):
# run()