function demo
randn('seed',1);
rand('seed',1);
clc;
clear;
close all;
% addpath('util');
% addpath('util');
n_set  = [300 500 1000 2000]; %dimension
r_set  = [5 10 20 30 50 100];   % rank
mu_set = [0.01 0.05 0.1 0.5 1 5 10 50];
ti_set = [10 30 50];

n_set  = [1500]; %dimension
r_set  = [10];   % rank
mu_set = [10];
ti_set = [10];

for it=1:length(ti_set)
    for id_n = 1:length(n_set)        % n  dimension
        for id_r = 1:length(r_set) % r  number of column
            for id_mu = 1:length(mu_set)
                
                n = n_set(id_n);
                r = r_set(id_r);
                mu = mu_set(id_mu);
                time_limit = ti_set(it);
                
                for i_rnd = 1:1  %times average.
                    fprintf('==============================================================================================\n');
                    
                    m = n;
                    B = randn(m,n);
                    seq = randperm(m*n,round(m*n*0.1));
%                     B(seq) = B(seq)*100;
 
                    A = -B'*B;
                   A = A / norm(A(:));

                    HandleObj = @(X) ComputeObj(X,A,mu);
                    fprintf('- n -- r -- mu --------\n');
                    fprintf('%4d %3d %3.3f \n',n,r,mu);
                    fprintf('----------------------------------------------------------------------------------\n');

                    X0 = proj_l2(randn(n,r),sqrt(r));
                    max_iter = 50000000;
                    tol = 1e-4;
                    inner_iter = 30;

%                     t00 = clock;
%                     [X1,his1,ts1] = DCA_SpectralGradient_Monotone(A,mu,r,X0,max_iter,time_limit);
%                     t1 = etime(clock,t00);
                    
%                     t0 = clock;
%                     [X1,his1,ts1] = ADMM_LineSearch(A,mu,r,X0,max_iter,time_limit);
%                     X1 = OrthProj(X1);
%                     t1 = etime(clock,t0);
%                     ddd
%                     t0 = clock;
%                     [X111,his111,ts111] = ADMM11(A,mu,r,X0,max_iter,time_limit);
%                     X111 = OrthProj(X111);
%                     t1 = etime(clock,t0);
%                                  
%                     plot(ts1,his1,ts111,his111);
%                     legend('method 1','method 2');
%                     HandleObj(X1)
%                     HandleObj(X111)      
%                     HandleObj(X1) -  HandleObj(X111)  
%                     ddd


                    

                  


                    
                    t0 = clock;
                    [X1,his1,ts1] = ADMM(A,mu,r,X0,max_iter,time_limit);
                    X1 = OrthProj(X1);
                    t1 = etime(clock,t0);
                    
                    
                                        t0 = clock;
                    [X2,his2,ts2] = DCA2_AdaptiveNesterov(A,mu,r,X0,max_iter,time_limit);
                    X2 = OrthProj(X2);
                    t2 = etime(clock,t0);
                    
                    

                    t0 = clock;
                    [X3,his3,ts3] = DCA2_AdaptiveNesterov_simple(A,mu,r,X0,max_iter,time_limit);
                    X3 = OrthProj(X3);
                    t3 = etime(clock,t0);
                    
                    
%                     
%                     ts1 (1:15)=[];
%                     his1 (1:15)=[];
%                     ts2 (1:15)=[];
%                     his2 (1:15)=[];
                    plot(ts1,his1,ts2,his2,ts3,his3);
                    legend('ADMM','DCA','DCA2');
                    HandleObj(X1)
                    HandleObj(X2)
                    HandleObj(X3)
     
                    ddddddd

                    t0 = clock;
                    [X3,his3,ts3] = DCA2_Adaptive(A,mu,r,X0,max_iter,time_limit);
                    X3 = OrthProj(X3);
                    t3 = etime(clock,t0);

                    plot(ts1,his1,ts2,his2,ts3,his3);
                    legend('method 1','method 2','method 3');
                    HandleObj(X1)
                    HandleObj(X2)
                    HandleObj(X3)
                    dddddd
                    t0 = clock;
                    [X4]= PAMAL_spca(-A,n,r,mu,max_iter,tol,X0,inner_iter,time_limit);
                    X4 = OrthProj(X4);
                    t4 = etime(clock,t0);
                    
                    t0 = clock;
                    [X5]= manpg_orth_sparse(-A,n,r,mu,X0,tol,inner_iter,time_limit);
                    X5 = OrthProj(X5);
                    t5 = etime(clock,t0);
                    
                    t0 = clock;
                    [X6]= manpg_orth_sparse_adap(-A,n,r,mu,X0,tol,inner_iter,time_limit);
                    X6 = OrthProj(X6);
                    t6 = etime(clock,t0);
                 
                    t0 = clock;
                    [X7]= Re_sub_grad_spca(-A,n,r,mu,X0,time_limit);
                    X7 = OrthProj(X7);
                    t7 = etime(clock,t0);
                    
                    t0 = clock;
                    [X8]= soc_spca(-A,n,r,mu,tol,X0,time_limit);
                    X8 = OrthProj(X8);
                    t8 = etime(clock,t0);
                    
                    
                    f1 = HandleObj(X1);
                    f2 = HandleObj(X2);
                    f3 = HandleObj(X3);
                    f4 = HandleObj(X4);
                    f5 = HandleObj(X5);
                    f6 = HandleObj(X6);
                    f7 = HandleObj(X7);
                    f8 = HandleObj(X8);
                    
                    
                    f1s(i_rnd) = f1;
                    f2s(i_rnd) = f2;
                    f3s(i_rnd) = f3;
                    f4s(i_rnd) = f4;
                    f5s(i_rnd) = f5;
                    f6s(i_rnd) = f6;
                    f7s(i_rnd) = f7;
                    f8s(i_rnd) = f8;
                    
                    plot(ts1,his1,ts2,his2,ts3,his3,ts4,his4,ts5,his5,ts6,his6,ts7,his7,ts8,his8);
                    legend('method 1','method 2','method 3','method 4','method 5','method 6','method 7','method 8');
                    
                end
                
                
                
                fprintf('                  ADMM: %f, time:%f, L1 norm :%f\n',mean(f1s),t1,sum(abs(X1(:))));
                fprintf('                  DCA1: %f, time:%f, L1 norm :%f\n',mean(f2s),t2,sum(abs(X2(:))));
                fprintf('                  DCA2: %f, time:%f, L1 norm :%f\n',mean(f3s),t3,sum(abs(X3(:))));
                fprintf('            PAMAL_spca: %f, time:%f, L1 norm :%f\n',mean(f4s),t4,sum(abs(X4(:))));
                fprintf('     manpg_orth_sparse: %f, time:%f, L1 norm :%f\n',mean(f5s),t5,sum(abs(X5(:))));
                fprintf('manpg_orth_sparse_adap: %f, time:%f, L1 norm :%f\n',mean(f6s),t6,sum(abs(X6(:))));
                 fprintf('     Re_sub_grad_spca: %f, time:%f, L1 norm :%f\n',mean(f7s),t7,sum(abs(X7(:))));
                fprintf('              soc_spca: %f, time:%f, L1 norm :%f\n',mean(f8s),t8,sum(abs(X8(:))));
                fprintf('----------------------------------------------------------------------------------\n');
            dddddd
            end
            
        end
        
    end
end

%% plot

% figure(1);
% plot(n_set, time.manpg, 'r-','linewidth',1); hold on;
% plot(n_set, time.manpg_BB, 'k-','linewidth',1); hold on;
% plot(n_set, time.soc, 'b--','linewidth',1); hold on;
% plot(n_set, time.pamal, 'c-.','linewidth',2); hold on;
% %plot(n_set, time.Rsub, 'g-.','linewidth',2);
% xlabel('dimenion-n');   ylabel('CPU');
% title(['comparison on CPU: different dimension',',r=',num2str(r),',\mu=',num2str(mu)]);
% legend('ManPG','ManPG-adap','SOC','PAMAL','Location','NorthWest');
% filename_pic1 = ['SPCA_CPU_n',  '_' num2str(r) '_' num2str(mu)  '.eps'];
% saveas(gcf,filename_pic1,'epsc')
%
%
% figure(2)
% semilogy(n_set, Fval.manpg-Fval.best+1e-16, 'r-s','MarkerSize',10,'linewidth',1); hold on;
% semilogy(n_set, Fval.manpg_BB-Fval.best+1e-16, 'k-o','MarkerSize',6,'linewidth',1); hold on;
% semilogy(n_set, Fval.soc-Fval.best+1e-16, 'b-d','MarkerSize',8,'linewidth',1); hold on;
% semilogy(n_set, Fval.pamal-Fval.best+1e-16, 'c-.','MarkerSize',20,'linewidth',1.5); hold on;
% %semilogy(n_set, Fval.Rsub -Fval.best+1e-16, 'g-.','MarkerSize',20,'linewidth',1.5);
% %legend('ManPG','ManPG-BB','SOC','PAMAL','Rsub','Location','NorthWest');
% legend('ManPG','ManPG-adap','SOC','PAMAL','Location','NorthWest');
%
% xlabel('dimenion-n');   ylabel('fucntion value difference');
% title(['comparison on function value difference: different dimension',',r=',num2str(r),',\mu=',num2str(mu)]);
% filename_pic2 = ['SPCA_Fval_n',  '_' num2str(r) '_' num2str(mu)  '.eps'];
% saveas(gcf,filename_pic2,'epsc')
%
% %
% %
% figure(3)
% plot(n_set, Sp.manpg, 'r-s','MarkerSize',10,'linewidth',1); hold on;
% plot(n_set, Sp.manpg_BB, 'k-o','MarkerSize',6,'linewidth',1); hold on;
% plot(n_set, Sp.soc, 'b-d','MarkerSize',8,'linewidth',1); hold on;
% plot(n_set, Sp.pamal, 'c-.','MarkerSize',20,'linewidth',1.5); hold on;
% %plot(n_set, Sp.Rsub, 'g-.','MarkerSize',20,'linewidth',1.5); %hold on;
% xlabel('dimenion-n');   ylabel('sparsity');
% legend('ManPG','ManPG-adap','SOC','PAMAL','Location','SouthEast');
% title(['comparison on sparsity: different dimension',',r=',num2str(r),',\mu=',num2str(mu)]);
% filename_pic3 = ['SPCA_Sparsity_n',  '_' num2str(r)  '_' num2str(mu) '.eps'];
% saveas(gcf,filename_pic3,'epsc')
%
%
% figure(4)
% plot(n_set, iter.manpg, 'r-s','MarkerSize',10,'linewidth',1); hold on;
% plot(n_set, iter.manpg_BB, 'k-o','MarkerSize',6,'linewidth',1); hold on;
% plot(n_set, iter.soc, 'b-d','MarkerSize',8,'linewidth',1); hold on;
% plot(n_set, iter.pamal, 'c-.','MarkerSize',20,'linewidth',1.5); %hold on;
% %plot(n_set, iter.Rsub, 'g-.','MarkerSize',20,'linewidth',1.5); %hold on;
% xlabel('dimenion-n');   ylabel('iter');
% legend('ManPG','ManPG-adap','SOC','PAMAL','Location','NorthWest');
% title(['comparison on iter: different dimension',',r=',num2str(r),',\mu=',num2str(mu)]);
% filename_pic4= ['SPCA_iter_n',  '_'  num2str(r)  '_' num2str(mu) '.eps'];
% saveas(gcf,filename_pic4,'epsc')
%
% close(figure(1));
% close(figure(2));
% close(figure(3));
% close(figure(4));
% filename = ['SPCA_comparison_n_'  num2str(r_set(id_r)) '_'  num2str(mu_set(id_mu)) '.csv'];
% csvwrite( filename, Result);

function [Best_X,histroy,ts] = ADMM(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(Y'AY) + mu*norm(X,1), X = Y, Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2, s.t. Y is orth


X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
 rho = rho_max ; scale = 2;
 
rho = 1;
Pi = randn(size(X))*1;
ts = [];
histroy = [];
% Y =  OrthProj(randn(size(X))); 
Y =  X; 
% beta = 100;

oooo = [];
for iter = 1:1000000

%     Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

% update X
% trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
% mu*norm(X,1) + 0.5 beta ||X-Y + Pi/beta||_F^2
   [X] = prox_l1(Y-Pi/rho,mu/rho);

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

    % update Y
    % trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y + Pi/beta||_F^2

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% mdot(Y,A*Y) + 0.5*beta*norm(X-Y+Pi/beta,'fro')^2;
O = X + Pi/rho;
% HandleObj_X = @(Y)mdot(Y,A*Y) + 0.5*beta*norm(Y-O,'fro')^2;
    L = 2*normA + rho;
%      L = 2*normA ;

    grad = 2*A*Y + rho*(Y-O);

    Y = OrthProj(Y - grad/L);

    diff = X - Y;
    Pi = Pi + rho * diff;
%     rho = rho + 10* norm(diff);
    true_fobj = HandleObjTrue(Y);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    dist = norm(diff,'fro');
    fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);

    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = Y;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    if ~mod(iter,30) % && (dist > 1e-3)
        rho = min(1e10,rho * scale);
    end



%     hhhhh = clock();
% %     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
% %         tttt1 = hhhhh;
% %         rho = rho * scale;
% % %           rho = rho_max;
% %     end
%     
%     
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(1e8,rho);
    
    

end
% plot(histroy)
% dd
Best_X = OrthProj(Best_X);
 
function [X,histroy,ts] = ADMM_LineSearch(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(Y'AY) + mu*norm(X,1), X = Y, Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2, s.t. Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta (r-2<X,Y> + <Y,Y>), s.t. Y is orth


X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;

nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
 rho = rho_max ; scale = 1;
 
% rho = 10;
Pi = randn(size(X))*0;
ts = [];
histroy = [];
% Y =  OrthProj(randn(size(X))); 
Y =  X; 
% beta = 100;

oooo = [];

MeriteFunction = @(X,Y)trace(Y'*A*Y) + mu*norm(X,1) + 0.5*rho_max*norm(X-Y,'fro')^2;
fobj = MeriteFunction(X,Y);

for iter = 1:1000000

%     Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

% update X
% trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
% mu*norm(X,1) + 0.5 beta ||X-Y + Pi/beta||_F^2
    % L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 rho (r-2<X,Y> + <X,X>), s.t. Y is orth
    % L(X,Y,pi) = mu*norm(X,1) + 0.5 rho ||X - (Y-Pi/rho)||_2^2
   [X] = prox_l1(Y-Pi/rho,mu/rho);
   fobj_old = fobj;
fobj = MeriteFunction(X,Y);
hhh = fobj - fobj_old;
 
% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

    % update Y
    % trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y + Pi/beta||_F^2

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% mdot(Y,A*Y) + 0.5*beta*norm(X-Y+Pi/beta,'fro')^2;
O = X + Pi/rho;
% HandleObj_X = @(Y)mdot(Y,A*Y) + 0.5*beta*norm(Y-O,'fro')^2;
    L = 2*normA + rho;
%      L = 2*normA ;

    grad = 2*A*Y + rho*(Y-O);

    Y = OrthProj(Y - grad/L);
   fobj_old = fobj;
fobj = MeriteFunction(X,Y);
hhh2 = fobj - fobj_old;


 fobj_old = fobj;

% for iiii= 1:1000000
    diff = X - Y;
    step = 0.5^2;
    Pi_test = Pi + step*rho * diff;
%     fobj = trace(Y'*A*Y) + mu*norm(X,1) + mdot(X-Y,Pi_test) + 0.5*rho*norm(X-Y,'fro')^2;
%     if(fobj<fobj_old),break;end
% end

Pi = Pi_test;
    
    
    rho = rho + 10* norm(diff);
    true_fobj = HandleObjTrue(Y);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    dist = norm(diff,'fro');
    fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);

    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    X
    Y
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

%     if ~mod(iter,30)% && (dist > 1e-3)
%         rho = rho * scale;
%     end


%     hhhhh = clock();
% %     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
% %         tttt1 = hhhhh;
% %         rho = rho * scale;
% % %           rho = rho_max;
% %     end
%     
%     
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(1e8,rho);
    
    

end
% plot(histroy)
% dd
X = OrthProj(Best_X);
ddd

function [X,histroy,ts] = ADMM_new(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(Y'AY) + mu*norm(X,1), X = Y, Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2, s.t. Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta (r-2<X,Y> + <Y,Y>), s.t. Y is orth


X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;

nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
 rho = rho_max ; scale = 1;
 
rho = 10;
Pi = randn(size(X))*1;
ts = [];
histroy = [];
% Y =  OrthProj(randn(size(X))); 
Y =  X; 
% beta = 100;

oooo = [];
for iter = 1:1000000

%     Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

% update X
% trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
% mu*norm(X,1) + 0.5 beta ||X-Y + Pi/beta||_F^2
    % L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 rho (r-2<X,Y> + <X,X>), s.t. Y is orth
    % L(X,Y,pi) = mu*norm(X,1) + 0.5 rho ||X - (Y-Pi/rho)||_2^2
   [X] = prox_l1(Y-Pi/rho,mu/rho);

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

    % update Y
    % trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y + Pi/beta||_F^2

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% mdot(Y,A*Y) + 0.5*beta*norm(X-Y+Pi/beta,'fro')^2;
O = X + Pi/rho;
% HandleObj_X = @(Y)mdot(Y,A*Y) + 0.5*beta*norm(Y-O,'fro')^2;
    L = 2*normA + rho;
%      L = 2*normA ;

    grad = 2*A*Y + rho*(Y-O);

    Y = OrthProj(Y - grad/L);


    diff = X - Y;
    Pi = Pi + rho * diff;
    rho = rho + 10* norm(diff);
    true_fobj = HandleObjTrue(Y);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    dist = norm(diff,'fro');
    fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);

    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    X
    Y
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

%     if ~mod(iter,30)% && (dist > 1e-3)
%         rho = rho * scale;
%     end


%     hhhhh = clock();
% %     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
% %         tttt1 = hhhhh;
% %         rho = rho * scale;
% % %           rho = rho_max;
% %     end
%     
%     
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(1e8,rho);
    
    

end
% plot(histroy)
% dd
X = OrthProj(Best_X);
ddd

function [X,histroy,ts] = ADMM11(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(Y'AY) + mu*norm(X,1), X = Y, Y is orth
% L(X,Y,pi) = trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2, s.t. Y is orth


X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
% rho = rho_max ;scale = 1;
% rho = rho_max;
rho = 1;
Pi = randn(size(X))*0;
ts = [];
histroy = [];
% Y =  OrthProj(randn(size(X))); 
Y =  X; 
% beta = 100;
gamma = 0.5;
oooo = [];
for iter = 1:1000000
gamma = 1/iter;
%     Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

% update X
% trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
% mu*norm(X,1) + 0.5 beta ||X-Y + Pi/beta||_F^2
   [X] = prox_l1(Y-Pi/rho,mu/rho);

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% oooo = [oooo;Lag];

    % update Y
    % trace(Y'AY) + mu*norm(X,1) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y||_F^2
    % trace(Y'AY) + <X-Y,Pi> + 0.5 beta ||X-Y + Pi/beta||_F^2

% Lag = mdot(Y,A*Y) + mu*norm(X(:),1) + mdot(X-Y,Pi) + 0.5*beta*norm(X-Y,'fro')^2;
% mdot(Y,A*Y) + 0.5*beta*norm(X-Y+Pi/beta,'fro')^2;
O = X + gamma*Pi/(rho);
% HandleObj_X = @(Y)mdot(Y,A*Y) + 0.5*beta*norm(Y-O,'fro')^2;
    L = 2*normA + rho;
%      L = 2*normA ;

    grad = 2*A*Y + rho*(Y-O);

    Y = OrthProj(Y - grad/L);

    diff = X - Y;
    Pi = gamma*Pi + (1-gamma)*rho*diff;

    rho = rho + norm(diff);
    true_fobj = HandleObjTrue(Y);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    dist = norm(diff,'fro');
    fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);

    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

%     if ~mod(iter,30)% && (dist > 1e-3)
%         rho = rho * scale;
%     end


%     hhhhh = clock();
% %     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
% %         tttt1 = hhhhh;
% %         rho = rho * scale;
% % %           rho = rho_max;
% %     end
%     
%     
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(1e8,rho);
    
    

end
% plot(histroy)
% dd
X = OrthProj(Best_X);
 
function [X,histroy,ts] = DCA2(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2), sigma(X)<=1

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)

X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
% rho = rho_max ;scale = 1;

ts = [];
histroy = [];
for iter = 1:max_iter

    % update Y
    % min_{Y} mu*norm(Y,1) + rho ||Y-X||_F^2
    % min_{Y} 0.5mu/rho*norm(Y,1) + 0.5||Y-X||_F^2
    
    [Y] = prox_l1(X,0.5*mu/rho);

    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2)
    
    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2*<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{X} trace(X'AX) - rho <X,Y>, sigma(X)<=1
   L = 2*normA;
    grad = 2*A*X - rho*2*Y;
     [X] = OrthProj(X - grad/L);

% HandleObj_X = @(X)mdot(X,A*X) - rho*2*mdot(X,Y);
% %     L = 1;
%     fobj_old = HandleObj_X(X);
%     for in =1:100
%     grad = 2*A*X - rho*2*Y;
%     [X] = OrthProj(X - grad/L);
%     if(HandleObj_X(X)<fobj_old)
%         break;
%     end
%     L = L*2;
%     end
    dist = abs(r -2*mdot(X,Y)+mdot(Y,Y));

 
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
%           rho = rho_max;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
%           rho = rho_max;
    end
    rho = min(rho_max,rho);
end
X = OrthProj(Best_X);




function [X,histroy,ts] = DCA2_Adaptive2(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2), sigma(X)<=1

% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2 + ||X-Xt||_F^2)

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)
X0 = OrthProj(X0);
X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;



nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
% rho_max  = rho_max * 10;

% rho = rho_max/(scale^20); %scale = 1;
% % rho = rho_max ;scale = 1;
% rho0 = 0.01;
% beta = rho_max; 
rho = 0.01;
 
ts = [];
histroy = [];
Y = X;
% HandleFun = @(X,Y,rho)trace(X'*A*X) + mu*norm(Y,1) + rho*(r-2*mdot(X,Y)+norm(Y,'fro')^2);
% last_obj = HandleFun(X,Y,rho);
% curr_obj = last_obj;
restate = 0;
for iter = 1:max_iter
 

restate = restate + 1;
    % update Y
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2 + ||X-Xt||_F^2)
    % min_{Y} mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2)
    % min_{Y} mu*norm(Y,1) + rho ||Y-X||_F^2 
    % min_{Y} 0.5 mu/rho*norm(Y,1) + 0.5||Y-X||_F^2 
    [Y] = prox_l1(X,0.5*mu/(rho));

    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2 + ||X-Xt||_F^2)
    
    L = 2*normA;
    grad = 2*A*X - rho*2*Y;

    X_old = X;
    [X] = OrthProj(X - grad/L);
    
    
    
%     last_obj = curr_obj;
%     curr_obj = HandleFun(X,Y,rho);
%     diff_f =  last_obj-curr_obj;
    
    if ((norm(X-X_old)<1e-3) && (restate>=10)) || (restate>=50)
        rho = min(1e10,rho*2);
        restate = 0;
    end
    
%     if( abs(diff_f / abs(1+curr_obj))<1e-6) && (restate>=10)
%         rho = min(1e10,rho*2);
%         restate = 0;
%     end
%     diff_X = norm(X-X_old,'fro');
%     if(diff_f/diff_X<0.01)
%        beta = min(1e10,beta*2);
%        curr_obj = HandleFun(X,Y,beta);
%     end

%    if(diff_f/diff_X < -1e-5)
%    end
%     if(curr_obj - last_obj )
% end
% if(~mod(iter,30))
     dist = r -2*mdot(X,Y)+mdot(Y,Y);
% 
% 
%     if(dist<0),
%         error('negative!');
%     end
% 
% %      beta = beta + stepsize*(r-2*mdot(X,Y)+mdot(Y,Y));
%     
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    %fprintf('iter:%d, dist:%f, tfobj:%f, beta:%f\n',iter,dist,true_fobj,beta);
      fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);
          histroy =[histroy;true_fobj];
          
              if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
              end
    
              cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
         break;
    end

% end
      


    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
  
    

    
%     hhhhh = clock();
%     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
%         tttt1 = hhhhh;
%         rho = rho * scale;
% %           rho = rho_max;
%     end
    
    
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(rho_max,rho);
end
X = OrthProj(Best_X);

function [X,histroy,ts] = DCA2_Adaptive_bak(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2), sigma(X)<=1

% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2) + beta (r-2<X,Y>+||Y||_F^2)

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)
X0 = OrthProj(X0);
X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;



nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
% rho_max  = rho_max * 10;

% rho = rho_max/(scale^20); %scale = 1;
% % rho = rho_max ;scale = 1;
% rho0 = 0.01;
% beta = rho_max; 
beta = 1;
stepsize = 100;
ts = [];
histroy = [];
for iter = 1:max_iter
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + (rho+beta) (r-2<X,Y>+||Y||_F^2)


% for in = 1:20
    % update Y
    % min_{Y} mu*norm(Y,1) + (rho+beta) ||Y-X||_F^2
    % min_{Y} 0.5mu/(rho+beta)*norm(Y,1) + 0.5||Y-X||_F^2
    
    [Y] = prox_l1(X,0.5*mu/(beta));

    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + (rho+beta) (r-2<X,Y>+||Y||_F^2)
    
    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + (rho+beta) (r-2*<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{X} trace(X'AX) - rho <X,Y>, sigma(X)<=1
    L = 2*normA;
    grad = 2*A*X - (beta)*2*Y;
    [X] = OrthProj(X - grad/L);

% end
if(~mod(iter,30))
    dist = r -2*mdot(X,Y)+mdot(Y,Y);


    if(dist<0),
        error('negative!');
    end

     beta = beta + stepsize*(r-2*mdot(X,Y)+mdot(Y,Y));
    
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    %fprintf('iter:%d, dist:%f, tfobj:%f, beta:%f\n',iter,dist,true_fobj,beta);
      fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,beta);
          histroy =[histroy;true_fobj];
          
              if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
              end
    
              cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
         break;
    end

end
      


    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
  
    

    
%     hhhhh = clock();
%     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
%         tttt1 = hhhhh;
%         rho = rho * scale;
% %           rho = rho_max;
%     end
    
    
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(rho_max,rho);
end
X = OrthProj(Best_X);

% plot(histroy)
% ddd
function [X,histroy,ts] = DCA_Adaptive(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)
X0 = OrthProj(X0);
X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
 

rho = rho_max; stepsize = 0.5;
% rho = rho_max/(scale^20); %scale = 1;
rho = rho_max ;scale = 1;

ts = [];
histroy = [];
 rhos = [];
for iter = 1:max_iter

 
    % update Y
    % min_{Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + rho (r-<X,Y>), ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y||_F^2 - rho <X,Y>, ||Y||_F^2 = r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y - rho X ||_F^2, ||Y||_F^2 = r
    
    [Y] = prox_l1_sphere(rho*X,mu,r);

    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{X} trace(X'AX) - rho <X,Y>, sigma(X)<=1
   L = 2*normA;
    grad = 2*A*X - rho*Y;
 
    [X] = OrthProj(X - grad/L);
 
% HandleObj_X = @(X)mdot(X,A*X) - rho*mdot(X,Y);
%     L = 1;
%     fobj_old = HandleObj_X(X);
%     for in =1:100
%     grad = 2*A*X - rho*Y;
%     [X] = OrthProj(X - grad/L);
%     if(HandleObj_X(X)<fobj_old)
%         break;
%     end
%     L = L*2;
%     end
    
 
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
      rho = rho + stepsize*(r-mdot(X,Y));
      rhos = [rhos;rho];
%       if(~mod(iter,10000))
%           close all;
%       plot(rhos)
       fprintf('iter:%d, fobj:%f, rho:%e, dist:%e\n',iter,true_fobj,rho,(r-mdot(X,Y)));
%       pause(1)
%       rhos = [];
%       end
% L = mdot(X,A*X) + mu*norm(Y,1) + rho*(r-mdot(X,Y));
% if((L_old-L) / (norm(X-X_old,'fro')) > 1)
% rho = rho*2;
% 
% end
% 

% L_old = L;
%     
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
          break;
    end

    
%     hhhhh = clock();
%     if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
%         tttt1 = hhhhh;
%         rho = rho * scale;
% %           rho = rho_max;
%     end
    
    
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% %           rho = rho_max;
%     end
%     rho = min(rho_max,rho);
end
X = OrthProj(Best_X);
%  plot(histroy)
%  ddd
function [X,histroy,ts] = DCA_SpectralGradient_Monotone(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r

X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;

alpha = 1;
nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
% rho_max = sqrt(2)* (2*normA*sqrt(r) + mu*sqrt(nr));


rho_max =2* (2*normA*sqrt(r) + mu*sqrt(nr));

rho = rho_max/(scale^20); %scale = 1;
%  rho = rho_max ;scale = 1;
S = X;
ts = [];
histroy = [];
xxp = 0*X;
for iter = 1:max_iter

    % update Y
    % min_{Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + rho (r-<X,Y>), ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y||_F^2 - rho <X,Y>, ||Y||_F^2 = r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y - rho X ||_F^2, ||Y||_F^2 = r
    
    [Y] = prox_l1_sphere(rho*X,mu,r);

    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{X} trace(X'AX) - rho <X,Y>, sigma(X)<=1
    L = 2*normA;
   HandleObj_X = @(X)mdot(X,A*X) - rho*mdot(X,Y);
%     L = 1;
    [fobj_old] = HandleObj_X(S);
    xp=X;
    for in =1:100
    grad = 2*A*X - rho*Y;
    [X] = OrthProj(S - grad/L);
    if(HandleObj_X(X)<fobj_old)
        break;
    end
    L = L*2;
    end
    
    alphap=alpha; alpha = (1+ sqrt(4*alpha*alpha +1))/2;
    beta=(alphap-1)/alpha;
 
    S = X + beta* xxp;
    xxp = X-xp;

    dist = abs(r - mdot(X,Y));

    fff_XY = mdot(X,A*X) + mu*sum(abs(Y(:))) + rho*sqrt(r-mdot(X,Y));
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    
    
    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
%           rho = rho_max;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
%           rho = rho_max;
    end
    rho = min(rho_max,rho);
end

X = proj_orth(Best_X);

function [X,histroy,ts] = DCA_SpectralGradient_Monotone1(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r

X = X0;
 
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
 


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
% rho_max = sqrt(2)* (2*normA*sqrt(r) + mu*sqrt(nr));


rho_max =2* (2*normA*sqrt(r) + mu*sqrt(nr));

rho = rho_max/(scale^20); %scale = 1;
rho = rho_max ;scale = 1;

ts = [];
histroy = [];


 
newstart = 1;

X = MGramSchmidt(X);
s = X;
x = s;
alpha = 1;
xxp = 0*x;

f_best = inf;
%% The main program
for iter=1:max_iter
    
      
       
    HandleObj = @(X)ComputePenObj(X,A,rho,r,mu);
 

    [f_old,g_old] = HandleObj(s);
    xp=x;
    max_in = 10000;
    L = 1;
    for in=1:max_in,

        v=s-g_old/L;
        % min_{x} 0.5 L ||x-(xt-g/L)||^2 + z * ||x||_1
        [x]=OrthProj(v);
 
        f_new = HandleObj(x);

        l_sum = f_new - f_old ;

        if(l_sum <  0)
            break;
        else
            L=2*L;
        end
        if(in==max_in)
            fprintf('warning! Lipschitz too large!');
        end
        
    end
 
    alphap=alpha; alpha = (1+ sqrt(4*alpha*alpha +1))/2;
    beta=(alphap-1)/alpha;
    beta = 0;
    s = x + beta* xxp;
    xxp = x-xp;
    f_curr = f_new  ;
    if(f_curr<f_best)
        f_best = f_curr;
        x_best = x;
    end
 
    
    
    
        true_fobj = HandleObjTrue(x);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = x;
        Best_X_f = true_fobj;
    end
    
    cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) %&& (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;newstart=1;
%            rho = rho_max;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
% % %           rho = rho_max;
newstart=1;
    end
    rho = min(rho_max,rho);
    
    
    continue;
    
    % method bb
%      X = OptStiefelGBB1(X,HandleObj);
% 
%      
%     true_fobj = HandleObjTrue(X);
%     % true_fobj = HandleObjPenalty(X,Y,rho);
%     
%     histroy =[histroy;true_fobj];
%     if(true_fobj< Best_X_f)
%         Best_X = X;
%         Best_X_f = true_fobj;
%     end
%     
%     cur_t = etime(clock(),t00000);
%     ts = [ts;cur_t];
%     if (cur_t > time_limit),
%         break;
%     end
% 
%     
%     hhhhh = clock();
%     if( etime(hhhhh,tttt1) > each ) %&& (dist > 1e-3)
%         tttt1 = hhhhh;
%         rho = rho * scale;newstart=1;
% %            rho = rho_max;
%     end
%     
%     
%     if(norm(X,'fro')^2 < r*0.9)
%         rho = rho * scale;
% % % %           rho = rho_max;
% newstart=1;
%     end
%     rho = min(rho_max,rho);
%     
%     
%  
%  
%      continue;
     
    [fobj,Grad] = HandleObj(X);
     
    if(newstart==1)
        stepsize = 1;
    else
        delta_X = X - X_old;
        delta_grad = Grad - Grad_old;
%         stepsize = mdot(delta_X,delta_grad) / mdot(delta_X,delta_X);
        stepsize = mdot(delta_X,delta_grad) / mdot(delta_grad,delta_grad);
 
        stepsize = max(min(stepsize, 1e10), 1e-10);
    end
    
    %%%%%%%% Line Search to find optimal step lambda %%%%%%%%
        for in = 1:100
            X_test = OrthProj(X - stepsize*Grad);
            [fobj_cur] = HandleObj(X_test);
            if(fobj_cur<fobj),
                break;
            end
            stepsize = stepsize / 2;
        end

    X = X_test;
    newstart = 0;
    X_old = X;
    Grad_old = Grad;
    
    Y = prox_l1_sphere(rho*X,mu,r);
%     dist = abs(r - mdot(X,Y));

    fff_XY = mdot(X,A*X) + mu*sum(abs(Y(:))) + rho*sqrt(r-mdot(X,Y));
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;newstart=1;
%            rho = rho_max;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
% % %           rho = rho_max;
newstart=1;
    end
    rho = min(rho_max,rho);

end

% plot(ts,histroy)

X = proj_orth(Best_X);

function [fobj,grad] = ComputePenObj(X,A,rho,r,mu)
AX = A*X;
Y = prox_l1_sphere(rho*X,mu,r);
fobj = mdot(X,AX) - rho*mdot(X,Y);
grad = 2*A*X - rho*Y;

function [X,histroy,ts] = DCA(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)

X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
rho_max  = rho_max * 10;


rho = rho_max/(scale^20); %scale = 1;
%  rho = rho_max ;scale = 1;

ts = [];
histroy = [];
for iter = 1:max_iter

    % update Y
    % min_{Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + rho (r-<X,Y>), ||Y||_F^2 <= r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y||_F^2 - rho <X,Y>, ||Y||_F^2 = r
    % min_{Y} mu*norm(Y,1) + 0.5 ||Y - rho X ||_F^2, ||Y||_F^2 = r
    
    [Y] = prox_l1_sphere(rho*X,mu,r);

    % update X
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r
    % min_{X} trace(X'AX) - rho <X,Y>, sigma(X)<=1
   L = 2*normA;
    grad = 2*A*X - rho*Y;
    [X] = OrthProj(X - grad/L);
    
% HandleObj_X = @(X)mdot(X,A*X) - rho*mdot(X,Y);
%     L = 1;
%     fobj_old = HandleObj_X(X);
%     for in =1:100
%     grad = 2*A*X - rho*Y;
%     [X] = OrthProj(X - grad/L);
%     if(HandleObj_X(X)<fobj_old)
%         break;
%     end
%     L = L*2;
%     end
    
    dist = abs(r - mdot(X,Y));

    fff_XY = mdot(X,A*X) + mu*sum(abs(Y(:))) + rho*sqrt(r-mdot(X,Y));
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy =[histroy;true_fobj];
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
%      if(~mod(iter,30))
%         fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
%             iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
%      end
    
    

    
cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
        break;
    end

    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
%           rho = rho_max;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
%           rho = rho_max;
    end
    rho = min(rho_max,rho);
end
X = proj_orth(Best_X);
% size(ts) 
% size(histroy) 
% plot(ts,histroy);
% ddd
% fprintf('Finished!\n');
% plot(histroy)
% dddd
function [X,histroy] = DCA0(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), sigma(Y)<=1, ||X||_F^2 <= r

% min_{X} trace(X'AX) + mu*norm(X,1) + rho sqrt(r- ||X||_*), sigma(Y)<=1, ||X||_F^2 <= r


X = X0;
% HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r - sum(svd(X)));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = histroy(1);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;
rho = 1*mu;


nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
% rho_max = sqrt(2)* (2*normA*sqrt(r) + mu*sqrt(nr));

rho_max = sqrt(2)* (2*normA*sqrt(r) + mu*sqrt(nr));

% rho = rho_max/(scale^20); %scale = 1;
 rho = rho_max ;scale = 1;

for iter = 1:max_iter
    
    
    % min_{Y} r-<X,Y>, sigma(Y)<=1
    % min_{Y} -<X,Y>, sigma(Y)=1
    % min_{Y} 0.5<Y,Y> - <X,Y>, sigma(Y)=1
    % min_{Y} 0.5||Y-X||_F^2, sigma(Y)=1
    [Y,nuclear_norm_X] = OrthProj(X);
    
    % fobj = trace(X'*A*X) + mu*norm(Y,1) + rho*(r-mdot(X,Y));
    % fobj = trace(X'*A*X) - rho*(mdot(X,Y));
    % grad = 2*A*X - rho*Y;
    % X = X - grad / Lip;
    
    % A is negative semidefinite
    % min_{X} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), s.t. ||X||_F^2 <= r
    down = sqrt(r-nuclear_norm_X);
    down = max(down,0.01);
    B = - rho*Y / (2 * down);
    % min_{X} trace(X'AX) + mu*norm(X,1) + <X,B>, s.t. ||X||_F^2 <= r
    [X] = AccerlatedProximalGradient_ConcaveMinimization1(X,A,B,mu,r,each);
 
    
    dist = abs(r - mdot(X,Y));
    

    fff_XY = mdot(X,A*X) + mu*sum(abs(X(:))) + rho*sqrt(r-mdot(X,Y));
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy(iter+1)=true_fobj;
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
     if(~mod(iter,30))
        fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
            iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
     end
    
    
    
    
    if (etime(clock(),t00000) > time_limit),
        break;
    end
    
    hhhhh = clock();
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
    end
    rho = min(rho_max,rho);
end

X = proj_orth(Best_X);
fprintf('Finished!\n');

function [X,histroy] = ExactPenalty_F1(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), sigma(Y)<=1, ||X||_F^2 <= r

X = X0;
% HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r - sum(svd(X)));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);


histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = histroy(1);
t1 = clock();
tttt1 = clock();
each = time_limit/50;
scale = 2;
rho = 0.1*mu;
for iter = 1:max_iter
    
    
    % min_{Y} r-<X,Y>, sigma(Y)<=1
    % min_{Y} -<X,Y>, sigma(Y)=1
    % min_{Y} 0.5<Y,Y> - <X,Y>, sigma(Y)=1
    % min_{Y} 0.5||Y-X||_F^2, sigma(Y)=1
    Y = OrthProj(X);
    
    % fobj = trace(X'*A*X) + mu*norm(Y,1) + rho*(r-mdot(X,Y));
    % fobj = trace(X'*A*X) - rho*(mdot(X,Y));
    % grad = 2*A*X - rho*Y;
    % X = X - grad / Lip;
    
    % A is negative semidefinite
    % min_{X} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), s.t. ||X||_F^2 <= r
    B = - rho*Y;
    % min_{X} trace(X'AX) + mu*norm(X,1) + <X,B>, s.t. ||X||_F^2 <= r
    [X] = ConcaveMinimization1(X,A,B,mu,r,each);
    
    %      HandleObj = @(X) ComputeObjSpectral(X,A,mu,rho,r);
    %      HandleProx = @(A,L)proj_orth_app(A);
    %      X = SpectralGradient_Monotone(X,HandleObj,HandleProx,Lip,1e-5); Y = OrthProj(rho*X);
    
    dist = abs(r - mdot(X,Y));
    
    
    
    
    fff_XY = mdot(X,A*X) + mu*sum(abs(X(:))) + rho*(r-mdot(X,Y));
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    
    histroy(iter+1)=true_fobj;
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    
    if(~mod(iter,30))
        fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
            iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
    end
    
    
    
    hhhhh = clock();
    if (etime(hhhhh,t1) > time_limit),
        break;
    end
    
    if( etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
    end
    
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
    end
end

X = proj_orth(Best_X);
fprintf('Finished!\n');



function [X,histroy] = ExactPenalty_F2(A,mu,r,X0,max_iter,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(Y,1), sigma(X)<=1, ||Y||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r, <X,Y> = r




X = X0;

% HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r - sum(svd(X)));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);
HandleObjPenalty = @(X,Y,rho)mdot(X,A*X) + mu*sum(abs(Y(:))) + rho*(r-mdot(X,Y));
histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = histroy(1);
t1 = clock();
tttt1 = clock();


each = time_limit/50;
scale = sqrt(2);
rho =0.1*mu;

for iter = 1:max_iter
    
    
    % min_Y mu ||Y||_1 - rho<X,Y>, s.t. ||Y||_F^2 <= r
    % min_Y mu ||Y||_1 - rho<X,Y>, s.t. ||Y||_F^2 = r
    % min_Y mu ||Y||_1 - rho<X,Y> + 0.5 ||Y||_F^2, s.t. ||Y||_F^2 = r
    % min_Y mu ||Y||_1 - rho<X,Y> + 0.5 ||Y||_F^2, s.t. ||Y||_F^2 = r
    
    Y = prox_l1_ball2(rho*X,mu,r);
    
    
    % fobj = trace(X'*A*X) + mu*norm(Y,1) + rho*(r-mdot(X,Y));
    % fobj = trace(X'*A*X) - rho*(mdot(X,Y));
    % grad = 2*A*X - rho*Y;
    % X = X - grad / Lip;
    
    % min_{X} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1
    B = - rho * Y;
    % min_{X} trace(X'AX) + <X,B>, sigma(X)<=1
    
    
     [X] = ConcaveMinimization2(X,A,B,each);
%     [X] = AccerlatedProximalGradient_ConcaveMinimization1(X,A,B,each);
    
    
    
    %     HandleObj = @(X)ComputeObj3333(X,A,mu,rho,r);
    %
    %    X = SpectralGradient_Monotone(X,HandleObj,HandleProx,Lip,tol/10);  Y = prox_l1_ball2(rho*X,mu,r);
    
    
    
    
    dist = abs(r - mdot(X,Y));
    fff_XY = HandleObjPenalty(X,Y,rho);
    true_fobj = HandleObjTrue(X);
    
    histroy(iter+1)=true_fobj;
    if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
    end
    
    if(~mod(iter,30))
        fprintf('iter:%d, true_fobj:%f, pen_fobj:%f, rho:%f, dist:%.4e, normX2:%.4e \n',...
            iter,true_fobj,fff_XY,rho,dist,norm(X,'fro')^2);
    end
    
    
    % last_k_ftol<tol && dist<tol && etime(clock(),t1) > time_limit) ||
    
    
    hhhhh = clock();
    if(etime(hhhhh,t1) > time_limit),break;end
    if(etime(hhhhh,tttt1) > each ) && (dist > 1e-3)
        tttt1 = hhhhh;
        rho = rho * scale;
    end
    
    if(norm(X,'fro')^2 < r*0.9)
        rho = rho * scale;
    end
    
end

X = proj_orth(Best_X);

fprintf('Finished!\n');















function [fobj,grad] = UpdateXComputeObj(X,A,rho,Y)
AX = A*X;
rhoY = rho*Y;
fobj = mdot(X,AX-rhoY) ;
grad = 2*AX - rhoY;


function [fobj,grad] = ComputeObjSpectral(X,A,mu,rho,r)
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-<X,Y>), sigma(X)<=1, ||Y||_F^2 <= r, <X,Y> = r
% min_{Y} mu*norm(Y,1) - rho <X,Y>, ||Y||_F^2 <= r
% min_{Y} 0.5 ||Y||_F^2 + mu*norm(Y,1) - rho <X,Y>, ||Y||_F^2 <= r
% min_{Y} 0.5 ||Y - rho*X||_F^2 + mu*norm(Y,1), ||Y||_F^2 <= r
Y = prox_l1_ball2(rho*X,mu,r);
fobj = mdot(X,A*X) + mu*sum(abs(Y(:))) + rho*(r-mdot(X,Y));
grad = 2*A*X - rho*Y;






function [X] = ConcaveMinimization2(X,A,B,time_limit)
% min_{X} trace(X'AX) + <X,B>, sigma(X)<=1
t1 = clock();
fobj_old = 1e100;
maxiter = 10000;

for iter=1:maxiter
    if(etime(clock(),t1) > time_limit),break;end
    
    AX = A*X;
    fobj  = mdot(X,AX) + mdot(X,B);
    grad = 2*AX + B;
    
    % min_X <X, grad> , s.t. sigma(X)<=1
    % min_X <X, grad>, s.t. sigma(X) = 1
    % min_X <X, grad> + 0.5||X||_F^2, s.t. sigma(X) = 1
    % min_X 0.5||X + grad||_F^2, s.t. sigma(X) = 1
    X = proj_orth(-grad);
    
    %    fprintf('iter:%d, fobj:%f\n',iter,fobj);
    histroy(iter) = fobj;
    
    
    rel_change = abs((fobj_old - fobj) / max(1,fobj_old));
    if(iter>10 && rel_change<1e-5)
        break;
    end
    fobj_old = fobj;
    
    
end
% plot(histroy)
% ddd
function [X_best,his]=AccerlatedProximalGradient_ConcaveMinimization1(X,A,B,mu,r,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1) + <X,B>, s.t. ||X||_F^2 <= r
% min_{Y} <X-Xt, grad_X> + mu*norm(X,1), s.t. ||X||_F^2 <= r
  
L = 1;
[n,r]=size(X);
flag=0;

Xp=X;
XXp=zeros(n,r);
alpha=1; S=X;
X_best = X;
HandleObjSmooth = @(X)ComputeObj_smooth(X,A,B);
HandleObjNonSmooth = @(X)mu*norm(X(:),1);
tot = 1e-5;
 his = [];
f_best = HandleObjSmooth(X)+ HandleObjNonSmooth(X);
histroy(1)=f_best;
memory = 10;
t1 = clock();
for iter=1:1000
    if(etime(clock(),t1) > time_limit),break;end
    [f_old,g_old] = HandleObjSmooth(S);
    Xp=X;
    max_in = 10000;
    for in=1:max_in,
        V=S-g_old/L;
        % min_{x} 0.5 L ||x-(xt-g/L)||^2 + mu*norm(X,1), s.t. ||X||_F^2 <= r
        % min_{x} 0.5 ||x-V||^2 + mu/L*norm(X,1), s.t. ||X||_F^2 <= r
        [X]=prox_l1_sphere(V,mu/L,r);
        V=X-S;
        r_sum=mdot(V,V);
        f_new = HandleObjSmooth(X);
        l_sum = f_new - f_old - mdot(g_old,X-S);
        if (r_sum <=1e-100)
            flag=1; % this shows that, the gradient step makes little improvement
            break;
        end
        if(l_sum <= 0.5*r_sum*L)
            break;
        else
            %             L=max(2*L,l_sum/r_sum);
            L=2*L;
        end

        if(in==max_in)
            fprintf('warning! Lipschitz too large!');
        end
    end
       
    alphap=alpha; alpha= (1+ sqrt(4*alpha*alpha +1))/2;
    beta=(alphap-1)/alpha;
    S = X + beta* XXp;
    XXp = X-Xp;
    f_curr = f_new  + HandleObjNonSmooth(X);
    if(f_curr<f_best)
        f_best = f_curr;
        X_best = X;
    end

    
    histroy(iter+1)=f_curr;
    
    FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    %  XDiff = s_norm / sqrt(n);
    if iter <= memory
        stop_seq_f(iter) = FDiff;
        %                 stop_seq_x(iter) = XDiff;
    else
        stop_seq_f  = [stop_seq_f(2:end) FDiff];
        %                 stop_seq_x  = [stop_seq_x(2:end); XDiff];
    end
    
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    % last_k_xtol=mean(stop_seq_x);
    last_k_ftol=mean(stop_seq_f);
    if (last_k_ftol <tot)
        if(histroy(end)<histroy(1)),
            break;
        end
    end
    

    
    his(iter) = f_curr;
    %     if (iterStep>50 && flag),break;end
end

% his = his(:);
% plot(his)
% ddd
function [X] = ConcaveMinimization1(X,A,B,mu,r,time_limit)
% min_{X} trace(X'AX) + mu*norm(X,1) + <X,B>, s.t. ||X||_F^2 <= r
% min_{Y} <X-Xt, grad_X> + mu*norm(X,1), s.t. ||X||_F^2 <= r


% HandleObj = @(x)HandleObjSmooth(x)+ HandleObjNonSmooth(x);

% histroy(1)=f_best;

t1 = clock();
fobj_old = 1e100;
maxiter = 10000;
for iter=1:maxiter
    if(etime(clock(),t1) > time_limit),break;end
    AX = A*X ;
    fobj_smooth = mdot(X,AX) + mdot(X,B);
    grad_smooth = 2*AX + B;
    fobj_nonsmooth = mu*norm(X(:),1);
    
    X = prox_l1_sphere(-grad_smooth,mu,r);
    
    % min_X <X, grad> + mu*norm(X,1), s.t. ||X||_F^2 <= r
    % min_X <X, grad> + mu*norm(X,1), s.t. ||X||_F^2 = r
    % min_X <X, grad> + 0.5||X||_F^2 + mu*norm(X,1), s.t. ||X||_F^2 = r
    % min_X 0.5||X + grad||_F^2 + mu*norm(X,1), s.t. ||X||_F^2 = r
    
    
    
    fobj = fobj_smooth + fobj_nonsmooth;
    %       fprintf('iter:%d, fobj:%f\n',iter,fobj);
    histroy(iter) = fobj;
    rel_change = abs((fobj_old - fobj) / max(1,fobj_old));
    if(iter>10 && rel_change<1e-5)
        break;
    end
    fobj_old = fobj;
end



function [flag] = CheckSmoothConstant(beta,fx,fy,x,y,grad_y)
% if f(x) - f(y) - <x-y, grad_y> - 0.5 beta ||x-y||_2^2 <=0
% then f is beta-smooth
x_y = x-y;
left = fx - fy - mdot(x_y,grad_y);
right = 0.5*beta*mdot(x_y,x_y);
if(left - right<=0)
    flag = 1;
else
    flag = 0;
end




function [x, histroy]=SpectralGradient_Monotone(x,HandleObj,HandlePro,Lip,tol)

maxIter = 150;

% opts.xtol = 1e-5;
% opts.gtol = 1e-5;
% opts.ftol = 1e-6;

[n,k]=size(x);

% opts.maxIter=min(opts.maxIter,1000);

memory=15;
stop_seq_f=1e10*ones(memory,1); % store (abs(histroy(iter-1) - histroy(iter)) / (1+ abs((histroy(iter-1))))

M = 10;
% alpha_max = 1/Lip;
% alpha_min = alpha_max/10000;

alpha_max =   10000;
alpha_min = 1/10000;

gama = 1e-5;
sita1=0.01;
sita2=0.99;

% alpha_min = 1e-15;
% alpha_max = 1e15;

hist=[];histroy=[];
timebegin=cputime;

[F,G]=HandleObj(x);
histroy(1)=F;


alpha=1;




%% The main program
for iter=1:maxIter
    
    D = HandlePro(x-alpha*G) - x;
    
    %%%%%%%% Line Search to find optimal step lambda %%%%%%%%
    tend=(iter);
    tbegin =max(1,iter - M +1);
    %      fprintf('iter:%d, begin:%d->end:%d\n',iter,tbegin,tend);
    f_max = max(histroy(tbegin : tend));
    
    x_plus = x + D;
    yita = sum(dot(G,D,1)); lambda =1;
    
    for inner=1:100
        [F_plus,G_plus]=HandleObj(x_plus);
        out = F_plus - f_max - gama * lambda*yita;
        if(out<=0 || lambda<=1e-12),break;end
        lambda_temp = (-0.5 * lambda*lambda*yita) / (F_plus - f_max -  lambda*yita);
        if(lambda_temp>=sita1 && lambda_temp <= sita2*lambda)
            lambda=lambda_temp;
        else
            lambda=lambda/2;
        end
        x_plus = x + lambda*D;
    end
    
    %%%%%%%% Line Search to find optimal step lambda %%%%%%%%
    x = x_plus;
    s = lambda*D;
    s_norm = norm(s,'fro');% s_norm=diff_norm, s_norm = sqrt(tr(s's))
    y = G_plus - G;
    G = G_plus;
    histroy(iter+1)=F_plus;
    hist(iter+1)=cputime-timebegin;
    b = sum(dot(s,y,1));
    if(b<=0)
        alpha=alpha_max;
    else
        alpha_temp = s_norm^2;
        alpha = min(alpha_max,max(alpha_min,alpha_temp/b));
    end
    
    FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    %  XDiff = s_norm / sqrt(n);
    if iter <= memory
        stop_seq_f(iter) = FDiff;
        %                 stop_seq_x(iter) = XDiff;
    else
        stop_seq_f  = [stop_seq_f(2:end); FDiff];
        %                 stop_seq_x  = [stop_seq_x(2:end); XDiff];
    end
    % sqrt(lambda)
    % norm(D,'fro')-(s_norm/sqrt(lambda))
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    % last_k_xtol=mean(stop_seq_x);
    last_k_ftol=mean(stop_seq_f);
    if (iter>10 && last_k_ftol < tol)
        if(histroy(end)<histroy(1)),
            break;
        end
    end
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    
end



function [X, histroy]=GradientMethod(X,HandleObj,HandlePro,Lip,tol,rho,mu,r,A)

maxIter = 200;

% opts.xtol = 1e-5;
% opts.gtol = 1e-5;
% opts.ftol = 1e-6;

[n,k]=size(X);

% opts.maxIter=min(opts.maxIter,1000);

memory=15;
stop_seq_f=1e10*ones(memory,1); % store (abs(histroy(iter-1) - histroy(iter)) / (1+ abs((histroy(iter-1))))


hist=[];histroy=[];
timebegin=cputime;

[F,G]=HandleObj(X);
histroy(1)=F;
HandleProx = @(X,stepsize)proj_orth_app(X);
%% The main program
for iter=1:maxIter
    
    Y = prox_l1_ball2(rho*X,mu,r);
    
    % grad = 2*A*X - rho*Y;
    % X = X - grad/Lip;
    % X = HandleProx(X,1/Lip);
    
    HandleObjSmooth = @(X)ComputeObjNesterov(X,A,rho,Y);
    HandleObjNonSmooth = @(X)0;
    [X]=AccerlatedProximalGradient(X,HandleObjSmooth,HandleObjNonSmooth,HandleProx,1e-4);
    
    % plot(his1)
    % pause
    fobj = trace(X'*A*X) + mu*sum(abs(Y(:))) + rho*(r-mdot(X,Y));
    
    histroy(iter+1)=fobj;
    
    FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    %  XDiff = s_norm / sqrt(n);
    if iter <= memory
        stop_seq_f(iter) = FDiff;
        %                 stop_seq_x(iter) = XDiff;
    else
        stop_seq_f  = [stop_seq_f(2:end); FDiff];
        %                 stop_seq_x  = [stop_seq_x(2:end); XDiff];
    end
    % sqrt(lambda)
    % norm(D,'fro')-(s_norm/sqrt(lambda))
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    % last_k_xtol=mean(stop_seq_x);
    last_k_ftol=mean(stop_seq_f);
    if (last_k_ftol < tol)
        if(histroy(end)<histroy(1)),
            break;
        end
    end
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    
end
% figure; plot(histroy)
% pause
%   if(~checkdec(histroy)),
% %        error('NonDesc');
%   end
%    if(histroy(end)>histroy(1))
%        histroy
%        plot(histroy)
%        error('NonDesc');
%   end
% plot(histroy)
% pause
function [fobj,grad] = ComputeObjNesterov(X,A,rho,Y)
fobj = trace(X'*A*X) - rho*mdot(X,Y);
grad = 2*A*X - rho*Y;

function [x_best,his]=AccerlatedProximalGradient(x,HandleObjSmooth,HandleObjNonSmooth,HandleProx,tot)
% This program solves the following optimization problem:
% f(x) + g(x)
% where we assume that f is smooth g is non-smooth
% HandleObjSmooth:           x   ->  [fobj,grad]
% HandleObjNonSmooth:        x   ->  [fobj]
% HandleProx:          [theta,a] ->  arg min_{x} 0.5 theta || x - a ||^2 + g(x)

% One xample:

% function example_LeastR
% clear, clc;
% %  min  1/2 || A x - y||^2 + lambda * ||x||_1
% % f(x) + g(x)
% % 0.5 L ||x-xt||^2 + <x-xt,g> + g(x)
% % 0.5 L ||x-(xt-g/L)||^2 + g(x)
% % proximal mapping:
%
% % 0.5 theta ||x - a||^2 + g(x)
%
%
% m=1000;  n=100;    % The data matrix is of size m x n
% A=randn(m,n);       % the data matrix
% y = randn(m,1);
% lambda=0.2;
% HandleObjSmooth = @(x)computeObj(x,A,y);
% HandleObjNonSmooth = @(x)lambda*sum(abs(x));
% x=zeros(n,1);
% HandleProx = @(theta,a)computeprox(theta,a,lambda);
% [x1, his]= AccerlatedProximalGradient(x,HandleObjSmooth,HandleObjNonSmooth,HandleProx);
% plot(his)
%
% function [fobj,grad] = computeObj(x,A,y)
% diff = A*x-y;
% fobj = 1/2*norm(diff)^2 ;
% grad = A'*diff ;
%
% function [x] = computeprox(theta,a,lambda)
% % 0.5 theta ||x - a||^2 + g(x)
% [x] = threadholding_l1(a,lambda/theta);
%
% function [x] = threadholding_l1(a,lambda)
% % solving the following OP:
% % min_{x} 0.5 ||x - a||^2 + lambda * sum(abs(x))
% x = sign(a).*max(0,abs(a)-lambda);

% last modified: 2016-01-29


[n,d]=size(x);
flag=0;

global L;

if(isempty(L))
    L=1;
end

xp=x;
xxp=zeros(n,d);
alpha=1; s=x;
x_best = x;
f_best = HandleObjSmooth(x)+ HandleObjNonSmooth(x);
histroy(1)=f_best;
memory=10;
for iter=1:1000,
    %     fprintf('*');
    [f_old,g_old] = HandleObjSmooth(s);
    xp=x;
    max_in = 10000;
    for in=1:max_in,
        v=s-g_old/L;
        % min_{x} 0.5 L ||x-(xt-g/L)||^2 + z * ||x||_1
        [x]=HandleProx(v,L);
        v=x-s;
        r_sum=mdot(v,v);
        f_new = HandleObjSmooth(x);
        l_sum = f_new - f_old - mdot(g_old,x-s);
        if (r_sum <=1e-100)
            flag=1; % this shows that, the gradient step makes little improvement
            break;
        end
        if(l_sum <= 0.5*r_sum*L)
            break;
        else
            %             L=max(2*L,l_sum/r_sum);
            L=2*L;
        end
        if(in==max_in)
            fprintf('warning! Lipschitz too large!');
        end
    end
    
    alphap=alpha; alpha= (1+ sqrt(4*alpha*alpha +1))/2;
    beta=(alphap-1)/alpha;
    s = x + beta* xxp;
    xxp = x-xp;
    f_curr = f_new  + HandleObjNonSmooth(x);
    if(f_curr<f_best)
        f_best = f_curr;
        x_best = x;
    end
    
    
    histroy(iter+1)=f_curr;
    
    FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    %  XDiff = s_norm / sqrt(n);
    if iter <= memory
        stop_seq_f(iter) = FDiff;
        %                 stop_seq_x(iter) = XDiff;
    else
        stop_seq_f  = [stop_seq_f(2:end) FDiff];
        %                 stop_seq_x  = [stop_seq_x(2:end); XDiff];
    end
    
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    % last_k_xtol=mean(stop_seq_x);
    last_k_ftol=mean(stop_seq_f);
    if (last_k_ftol <tot)
        if(histroy(end)<histroy(1)),
            break;
        end
    end
    
    
    
    his(iter) = f_curr;
    %     if (iterStep>50 && flag),break;end
end
% his = his(:);



function [X, histroy,iter,hist]=SpectralGradient(X,HandleObj,HandleProx,Lip,tol,A,mu,rho,r)

MaxIter=100;


[n,k]=size(X);



memory = 10; M = 1;  alpha_max = 1/Lip;

gama = 0.25;


hist=[];histroy=[];
timebegin=cputime;

[F,G]=HandleObj(X);
histroy(1)=F;
hist(1)=cputime-timebegin;
stop_seq_f = [];
stop_seq_x = [];

alpha = alpha_max;
L = 1/alpha;
Y = prox_l1_sphere(rho*X,mu,r);
%% The main program
for iter=1:MaxIter
    
    Y = prox_l1_sphere(rho*X,mu,r);
    
    
    fobj = trace(X'*A*X) + mu*sum(abs(Y(:))) + rho*(r-mdot(X,Y));
    grad = 2*A*X - rho*Y;
    X_old = X;
    %     [f_last,g_last]=HandleObj(X);
    X  = HandleProx(X - grad/L,1/L);
    %     f_max = histroy(end);
    histroy(iter+1) = fobj;
    %     L = 1/alpha;
    %     for inner=1:1000000
    %         x_plus  = HandleProx(x - g_last/L,1/L);
    %         [f_curr,G_plus]=HandleObj(x_plus);
    %         diff = x_plus-x;  % the difference between the new approximate solution x
    %         r_sum1 = 0.5*sum(dot(diff,diff,1));
    %         l_sum1 = f_curr - f_last - sum(dot(diff,G_plus,1));
    %         if(l_sum1 - r_sum1 * L <=0)
    %             break;
    %         end
    %         L = 2*L;
    %     end
    
    diff_norm = norm(X - X_old,'fro');
    %     %        fprintf('%.10f\n',F_plus);
    %     %%%%%%%% Line Search to find optimal step lambda %%%%%%%%
    %     s = x_plus-x;
    %     x = x_plus;
    %     s_norm = norm(s,'fro');% s_norm=diff_norm, s_norm = sqrt(tr(s's))
    %     y = G_plus - g_last;
    
    %     %         hist(iter+1)=cputime-timebegin;
    %     b = sum(dot(s,y,1));
    %
    %     if(b<=0)
    %         alpha=alpha_max;
    %     else
    %         %             alpha_temp = trace (s'*s);
    %         alpha_temp = s_norm^2;
    %         alpha = min(alpha_max,max(alpha_max/1000,alpha_temp/b));
    %     end
    
    FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    XDiff = diff_norm / sqrt(n);
    
    if iter <= memory
        stop_seq_f(iter) = FDiff;
        stop_seq_x(iter) = XDiff;
    else
        stop_seq_f  = [stop_seq_f(2:end) FDiff];
        stop_seq_x  = [stop_seq_x(2:end) XDiff];
    end
    
    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    last_k_xtol=mean(stop_seq_x);
    last_k_ftol=mean(stop_seq_f);
    if  all( [last_k_ftol] < [tol])
        break; %diff_norm < tol*0.1 || last_k_xtol
    end
    
end

function [x, histroy,iter,hist]=SpectralGradient2(X,HandleObj,HandleProx,Lip,tol,A,mu,rho,r)

MaxIter=100;


[n,k]=size(X);



memory = 10; M = 1;  alpha_max = 1/Lip;

gama = 0.25;


hist=[];histroy=[];
timebegin=cputime;

[F,G]=HandleObj(X);
histroy(1)=F;
hist(1)=cputime-timebegin;
stop_seq_f = [];
stop_seq_x = [];

alpha = alpha_max;
L = 1/alpha;
%% The main program
for iter=1:MaxIter
    
    [f_last,g_last]=HandleObj(X);
    X  = HandleProx(X - g_last/L,1/L);
    %     f_max = histroy(end);
    histroy(iter) = f_last;
    %     L = 1/alpha;
    %     for inner=1:1000000
    %         x_plus  = HandleProx(x - g_last/L,1/L);
    %         [f_curr,G_plus]=HandleObj(x_plus);
    %         diff = x_plus-x;  % the difference between the new approximate solution x
    %         r_sum1 = 0.5*sum(dot(diff,diff,1));
    %         l_sum1 = f_curr - f_last - sum(dot(diff,G_plus,1));
    %         if(l_sum1 - r_sum1 * L <=0)
    %             break;
    %         end
    %         L = 2*L;
    %     end
    
    
    %     %        fprintf('%.10f\n',F_plus);
    %     %%%%%%%% Line Search to find optimal step lambda %%%%%%%%
    %     s = x_plus-x;
    %     x = x_plus;
    %     s_norm = norm(s,'fro');% s_norm=diff_norm, s_norm = sqrt(tr(s's))
    %     y = G_plus - g_last;
    
    %     %         hist(iter+1)=cputime-timebegin;
    %     b = sum(dot(s,y,1));
    %
    %     if(b<=0)
    %         alpha=alpha_max;
    %     else
    %         %             alpha_temp = trace (s'*s);
    %         alpha_temp = s_norm^2;
    %         alpha = min(alpha_max,max(alpha_max/1000,alpha_temp/b));
    %     end
    
    %     FDiff = abs(histroy(iter) - histroy(iter+1)) / (1+ abs((histroy(iter))));
    %     XDiff = s_norm / sqrt(n);
    %
    %     if iter <= memory
    %         stop_seq_f(iter) = FDiff;
    %         stop_seq_x(iter) = XDiff;
    %     else
    %         stop_seq_f  = [stop_seq_f(2:end) FDiff];
    %         stop_seq_x  = [stop_seq_x(2:end) XDiff];
    %     end
    %
    %     %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    %     last_k_xtol=mean(stop_seq_x);
    %     last_k_ftol=mean(stop_seq_f);
    %     if s_norm < tol*0.1 || all( [last_k_xtol,last_k_ftol] < [tol, tol])
    %         break;
    %     end
    %     %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    %
end
figure;      plot(histroy)
pause
% pause
%
function [X] = ExactPenaltyF1(A,mu,r,X0,max_iter)
%min Tr(X'*A*X) + mu*norm(X,1) s.t. X'*X=Ir. X \in R^{n*r}
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(X'AX) + mu*norm(X,1), ||X||_F \leq sqrt{r}, svd(X)==r
% min_{X} trace(X'AX) + mu*norm(X,1) + rho (r -||X||_* ), s.t. ||X||_F \leq sqrt{r}
% min_{X,Y} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), s.t. ||X||_F \leq sqrt{r}, sigma(Y)<=1


[n]=size(A,1);
% maxeigA = max(abs(eig(A)));
maxeigA = abs(eigs(A,1));
maxrho = 5000;

rho = 1;%rho = 5000;
A = A + eye(n)*maxeigA*2;
small = abs(eigs(A,1,'smallestabs'));
large = abs(eigs(A,1));

X = X0;
% X = proj_l2(randn(n,r),sqrt(r));

Lip = abs(eigs(A,1))*2;

% Lip = 1000;
eps1 = 1e-5;
HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r - sum(svd(X)) );
HandleObj  = @(X)trace(X'*A*X) + mu*sum(abs(X(:)));

for iter = 1:100
    rho = 1000;
    % if(0==sum(abs(X(:))) || ~mod(iter,10)),rho = min(maxrho,rho * 10);end
    HandleObj = @(X)ComputeObj22(X,A,mu,rho,r);
    HandleProx = @(A,stepsize)prox_l1_ball(A,mu*stepsize,r);
    X = SpectralGradient(X,HandleObj,HandleProx);
    fprintf('iter:%d, fobj:%f\n',iter,HandleObj(proj_orth(X)));
    X'*X
end


X = proj_orth(X);

function [fobj,grad] = ComputeObj22(X,A,mu,rho,r)
[U,D,V]=svd(X,0);
Y = U*V';
fobj = trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r-mdot(X,Y));
grad = 2*A*X - rho*Y;

function [x, histroy]=ProximalPointGradient(x,HandleObj,HandleProx,Lip)

MaxIter=100;

alpha = 1/Lip;
for iter=1:MaxIter
    [fobj,grad] = HandleObj(x);
    x = HandleProx(x-alpha*grad,alpha);
    histroy(iter) = fobj;
end
figure;      plot(histroy)
pause(1)

function [X] = ExactPenalty11(A,mu,r,X0,max_iter)
%min Tr(X'*A*X) + mu*norm(X,1) s.t. X'*X=Ir. X \in R^{n*r}
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(X'AX) + mu*norm(X,1), ||X||_F \leq sqrt{r}, svd(X)==r
% min_{X} trace(X'AX) + mu*norm(X,1) + rho (r -||X||_* ), s.t. ||X||_F \leq sqrt{r}
% min_{X,Y} trace(X'AX) + mu*norm(X,1) + rho (r-<X,Y>), s.t. ||X||_F \leq sqrt{r}, sigma(Y)<=1

[n]=size(A,1);
% maxeigA = max(abs(eig(A)));
maxeigA = abs(eigs(A,1));
maxrho = 5000;

rho = 1;rho = 5000;
A = A + eye(n)*maxeigA*2;
small = abs(eigs(A,1,'smallestabs'));
large = abs(eigs(A,1));

X = X0;
% X = proj_l2(randn(n,r),sqrt(r));

Lip = abs(eigs(A,1))*2;

% Lip = 1000;
eps1 = 1e-5;
HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*(r - sum(svd(X)) );
HandleObj  = @(X)trace(X'*A*X) + mu*sum(abs(X(:)));

for iter = 1:max_iter
    
    %     if(0==sum(abs(X(:))) || ~mod(iter,100)),rho = min(maxrho,rho * 2);end
    [U,D,V]=svd(X,0);
    Y = U*V';
    B = -rho*Y;
    %     if(~mod(iter,100)) rho = min(10,rho * 2);end
    % trace(X'AX) + mu*norm(X,1) - rho <X,Y>, s.t. ||X||_F \leq sqrt{r}
    %     old_X = X;
    %     Y = X + beta *(X-old_X);
    % min_X trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B)
    X = SolveConvexSubproblem(X,A,B,mu,Lip,small,large);
    
    % min_X 0.5||X-A||_{fro}^2 + lambda ||X||_1, s.t. ||X||_F <= sqrt(r)
    his (iter) = HandleObjX(X);
    %     fprintf('iter:%d, fobj:%f\n',iter,HandleObj(OrthProj(X)));
end

X = proj_orth(X);



function [X] = ExactPenalty_lp(A,mu,r,X0,max_iter)

%min Tr(X'*A*X) + mu*norm(X,1) s.t. X'*X=Ir. X \in R^{n*r}
% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X} trace(X'AX) + mu*norm(X,1), ||X||_F \leq sqrt{r}, svd(X)==r
% min_{X} trace(X'AX) + mu*norm(X,1) + rho sqrt(r + eps1 -||X||_* ), s.t. ||X||_F \leq sqrt{r}


[n]=size(A,1);
% maxeigA = max(abs(eig(A)));
maxeigA = abs(eigs(A,1));
maxrho = 2* (mu*sqrt(n*r) + sqrt(r) * maxeigA);
maxrho = 5000;

rho = 1000.01;
A = A + eye(n)*maxeigA*2;

X = X0;
% X = proj_l2(randn(n,r),sqrt(r));

Lip = abs(eigs(A,1))*2;

% Lip = 1000;
eps1 = 1e-5;
HandleObjX = @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + rho*sqrt(r + eps1 - sum(svd(X)) );
HandleObj  = @(X)trace(X'*A*X) + mu*sum(abs(X(:)));

for iter = 1:max_iter
    
    %     if(0==sum(abs(X(:))) || ~mod(iter,10)),rho = min(maxrho,rho * 2);end
    [U,D,V]=svd(X,0);
    
    
    sss = -2*sqrt(r+eps1-sum(diag(D)));
    subgrad = (rho/sss)*U*V';
    
    %     if(~mod(iter,100)) rho = min(10,rho * 2);end
    % trace(X'AX) + mu*norm(X,1) + rho <X,subgrad>, s.t. ||X||_F \leq sqrt{r}
    %     old_X = X;
    %     Y = X + beta *(X-old_X);
    X = SolveConvexSubproblem(X,A,subgrad,mu,Lip);
    
    
    % min_X 0.5||X-A||_{fro}^2 + lambda ||X||_1, s.t. ||X||_F <= sqrt(r)
    his (iter) = HandleObjX(X);
    %       fprintf('iter:%d, fobj:%f\n',iter,HandleObj(OrthProj(X)));
end

X = proj_orth(X);

%  plot(his)
function [X] = SolveConvexSubproblem(X,A,B,mu,Lip,small,large)
% It solves the following problem:
% min_X trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B)
% s.t. trace(X'*X) <= r

% addpath('G:\cvx');
[n,r] = size(X);

% cvx_begin quiet
% variables X
% minimize( trace(X'*A*X) + mu*sum(abs(X(:))) + trace(X'*B) )
% subject to
% trace(X'*X) <= r
% cvx_end
% X
% return;
HandleObjConvex= @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B); %
grad = 2*A*X + B;
Xbar = prox_l1_ball(X - grad / Lip,mu/Lip,r);
Gbar = @(X)2*A*X + B;
alpha = sqrt(small/large);
for in = 1:130
    X_old = X;
    X = prox_l1_ball(Xbar - Gbar(Xbar) / Lip,mu/Lip,r);
    Xbar = X + (1-alpha)/(1+alpha)*(X-X_old);
    his(in)= HandleObjConvex(X_old);
    if(in>2&&norm(X-X_old,'fro')<1e-12),break;end
end
X = X_old;

function [X] = SolveConvexSubproblem_nesterov(X,A,B,mu,Lip,small,large)
% It solves the following problem:
% min_X trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B)
% s.t. trace(X'*X) <= r

% addpath('G:\cvx');
[n,r] = size(X);

% cvx_begin quiet
% variables X
% minimize( trace(X'*A*X) + mu*sum(abs(X(:))) + trace(X'*B) )
% subject to
% trace(X'*X) <= r
% cvx_end
% X
% return;
HandleObjConvex= @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B); %
grad = 2*A*X + B;
Xbar = prox_l1_ball(X - grad / Lip,mu/Lip,r);
Gbar = @(X)2*A*X + B;
alpha = sqrt(small/large);
for in = 1:130
    X_old = X;
    X = prox_l1_ball(Xbar - Gbar(Xbar) / Lip,mu/Lip,r);
    Xbar = X + (1-alpha)/(1+alpha)*(X-X_old);
    his(in)= HandleObjConvex(X_old);
    if(in>2&&norm(X-X_old,'fro')<1e-12),break;end
end
X = X_old;


% HandleObjConvex= @(X)trace(X'*A*X) + mu*sum(abs(X(:))) + mdot(X,B); %
%     for in = 1:130
% grad = 2*A*X + B;
% X_old = X;
% X = prox_l1_ball(X - grad / Lip,mu/Lip,r);
% if(norm(X-X_old,'fro')<1e-12),break;end
% %      fs(in)=HandleObjConvex(X);
%     end


%        plot(fs)
%      pause(1)
% dddd







function [f,g] = ComputeObj_smooth(X,A,B)
AX = A*X;
f = mdot(X,AX) + mdot(X,B);
g = 2*AX + B;






function [X,histroy,ts] = DCA2_AdaptiveNesterov_simple(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2), sigma(X)<=1

% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5 r-<X,Y>+0.5||Y||_F^2)

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)
X0 = OrthProj(X0);
X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;



nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
% rho_max  = rho_max * 10;

% rho = rho_max/(scale^20); %scale = 1;
% % rho = rho_max ;scale = 1;
% rho0 = 0.01;
% beta = rho_max; 
rho = 1;
%  rho = rho_max;
ts = [];
histroy = [];
Y = X;
% HandleFun = @(X,Y,rho)trace(X'*A*X) + mu*norm(Y,1) + rho*(r-2*mdot(X,Y)+norm(Y,'fro')^2);
% last_obj = HandleFun(X,Y,rho);
% curr_obj = last_obj;
restate = 0;
for iter = 1:max_iter
 

    % update Y
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5r-<X,Y>+0.5||Y||_F^2)
    % min_{Y} mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2)
    % min_{Y} mu*norm(Y,1) + rho ||Y-X||_F^2 
    % min_{Y} 0.5 mu/rho*norm(Y,1) + 0.5||Y-X||_F^2 

    [X,Y] = ComputeSubProbSimple(X,A,mu,rho,normA,r);

%     if ((norm(X-X_old,'fro')<1e-5))% && (restate>=10)) || (restate>=50)

     dist = 0.5*r - mdot(X,Y)+0.5*mdot(Y,Y);
     if(dist>1e-7)
    rho = min(1e10,rho*2);
     end
  
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    %fprintf('iter:%d, dist:%f, tfobj:%f, beta:%f\n',iter,dist,true_fobj,beta);
    fprintf('iter:%d, dist: %e, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);
    histroy =[histroy;true_fobj];
          
              if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
              end
    
              cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
         break;
    end



end
X = OrthProj(Best_X);



function [X,histroy,ts] = DCA2_AdaptiveNesterov(A,mu,r,X0,max_iter,time_limit)

% min_{X} trace(X'AX) + mu*norm(X,1), X is orth
% min_{X,Y} trace(X'AX) + mu*norm(X,1), sigma(Y)<=1, ||X||_F^2 <= r, <X,Y> = r
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2), sigma(X)<=1

% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5 r-<X,Y>+0.5||Y||_F^2)

% ||2*A*X + mu sign(X)||_F 
% 2||AX||_F + mu ||sign(X)||_F
% 2*normA*sqrt(r) +  mu*sqrt(nr)
X0 = OrthProj(X0);
X = X0;
 
% A = A + abs(laneig((A+A')/2,1))*eye(size(A,1));
HandleObjTrue  = @(X)ComputeObj(X,A,mu);

% histroy(1) = HandleObjTrue(X);
Best_X = X;
Best_X_f = HandleObjTrue(X);
t00000 = clock();
tttt1 = clock();
each = time_limit/150;
scale = 2;



nr = size(X,1)* size(X,2);
normA = abs(laneig((A+A')/2,1));
rho_max = 2*normA*sqrt(r) + mu*sqrt(nr);
% rho_max  = rho_max * 10;

% rho = rho_max/(scale^20); %scale = 1;
% % rho = rho_max ;scale = 1;
% rho0 = 0.01;
% beta = rho_max; 
rho = 0.01;
%  rho = rho_max;
ts = [];
histroy = [];
Y = X;
% HandleFun = @(X,Y,rho)trace(X'*A*X) + mu*norm(Y,1) + rho*(r-2*mdot(X,Y)+norm(Y,'fro')^2);
% last_obj = HandleFun(X,Y,rho);
% curr_obj = last_obj;
restate = 0;
for iter = 1:max_iter
 

 
    % update Y
    % min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5r-<X,Y>+0.5||Y||_F^2)
    % min_{Y} mu*norm(Y,1) + rho (r-2<X,Y>+||Y||_F^2)
    % min_{Y} mu*norm(Y,1) + rho ||Y-X||_F^2 
    % min_{Y} 0.5 mu/rho*norm(Y,1) + 0.5||Y-X||_F^2 
   

    [X,Y] = ComputeSubProb(X,A,mu,rho,normA,r);

%   if ((norm(X-X_old,'fro')<1e-5))% && (restate>=10)) || (restate>=50)

  
         dist = 0.5*r - mdot(X,Y)+0.5*mdot(Y,Y);
     if(dist>1e-7)
    rho = min(1e10,rho*2);
     end
     
     
    true_fobj = HandleObjTrue(X);
    % true_fobj = HandleObjPenalty(X,Y,rho);
    %fprintf('iter:%d, dist:%f, tfobj:%f, beta:%f\n',iter,dist,true_fobj,beta);
    fprintf('iter:%d, dist: %f, fobj:%e, rho:%e\n',iter,dist,true_fobj,rho);
    histroy =[histroy;true_fobj];
          
              if(true_fobj< Best_X_f)
        Best_X = X;
        Best_X_f = true_fobj;
              end
    
              cur_t = etime(clock(),t00000);
    ts = [ts;cur_t];
    if (cur_t > time_limit),
         break;
    end



end
X = OrthProj(Best_X);


function [x,his,flag] = NesterovQuadL1Opt(x,A,b,lambda,max_iter,n)
% solve the following OP using proximal point method
% min_{x} 0.5x'Ax + b'x + lambda|x|_1

[eigv]=eig(A);
L = eigv(n);
mu = eigv(1);

if(mu<1e-5),
    flag = 1;
else
    flag = 0;
end

his=[];
x0=x;
y = x;
alpha = 1;
his=[];
HandleObj = @(x) 0.5*x'*A*x + b'*x + lambda*sum(abs(x));
f0 = HandleObj(x);

for iter = 1:max_iter,
    
    fobj = HandleObj(x);
    grad = A*y + b;
    %     rel_change=abs(fobj-fobj_o)/abs(fobj_o);
    %     if(rel_change <1e-12),break;end
    %     fobj_o=fobj;
    his=[his;fobj];
    %     fprintf('iter:%d, fobj:%f\n',iter,fobj);
    x_old = x;
    [x] = threadholding_l1(y-grad/L,lambda/L);
    alpha_o = alpha;
    alpha = ((mu/L - alpha*alpha) + sqrt((alpha*alpha - mu/L)^2 + 4*alpha*alpha))/2;
    beta = alpha_o*(1-alpha_o) / ( alpha_o*alpha_o+alpha);
    diff = x-x_old;
    dist = norm(diff);
    if(dist<1e-12 && iter>=10),break;end
    y = x + beta * diff;
end

f1 = HandleObj(x);
if(f1>f0),
    x=x0;
end



function [X,Y_val] = ComputeSubProb_bak(X,A,prog_mu,rho,normA,r)
% min_{X} trace(X'AX) + <X,B> + rho*||X||_F^2

Y = @(X)prox_l1(X,0.5*prog_mu/(rho));

% update X
% min_{X} trace(X'AX) + rho (r-2<X,Y(X)> + 2||X-Xt||_F^2)
L = 2*normA;% + 4*rho;
% mu = 2*rho;

h_fobj = @(X)mdot(X,A*X) + rho*(r-2*mdot(X,Y(X)));% + 2*rho*norm(X-Xt,'fro')^2;
h_grad = @(X)2*A*X -2*rho*Y(X);% + 4*rho*(X-Xt);


% [X] = AppOrthProj(X-grad/L);

% alpha = sqrt(mu/L);
his = [];
for iter = 1:200
%     fobj = h_fobj(X1);
%     his = [his;fobj];
    X_old = X;
    [X] = AppOrthProj(X-h_grad(X)/L);
    dist = norm(X-X_old,'fro');
    if(dist<1e-3 && iter>10),break;end
end
% figure;plot(his) 
% pause(1)
% ddddd
Y_val = Y(X);

function [X,Y_val] = ComputeSubProbSimple(X,A,prog_mu,rho,normA,r)
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5 r-<X,Y>+0.5||Y||_F^2)
% Y = argmin_{Y} mu*norm(Y,1) + rho (0.5||Y-X||_F^2)
% Y = argmin_{Y} mu/rho*norm(Y,1) + 0.5||Y-X||_F^2

Y = @(X)prox_l1(X,prog_mu/rho);

% update X
% min_{X} trace(X'AX) + rho (r-2<X,Y(X)> + 2||X-Xt||_F^2)
L = 2*normA;% + 4*rho;
% mu = 2*rho;

h_fobj = @(X)mdot(X,A*X) + rho*(0.5*r-mdot(X,Y(X)));% + 2*rho*norm(X-Xt,'fro')^2;
h_grad = @(X)2*A*X - rho*Y(X) ;% + 4*rho*(X-XXXX);

% assign xp with x, and Axp with Ax
Xp = X;  XXp=0*Xp;
alphap=0; alpha=1;

% his = [];
% for iter = 1:200
%     X_old = X;
%     [X] = AppOrthProj(X-h_grad(X)/L);
%     dist = norm(X-X_old,'fro');
%     if(dist<1e-3 && iter>10),break;end
% end

% X1 = AppOrthProj(randn(size(X)));
% X2 = AppOrthProj(randn(size(X)));
% norm(h_grad(X1) - h_grad(X2),'fro') / norm(X1-X2,'fro')
% L
% ddd

his = [];
for iter=1:300

%     S = X + (alphap-1)/alpha*XXp;
% (alphap-1)/alpha
    S = X + 0.9*XXp;
    Xp = X;
    X = AppOrthProj(S-h_grad(S)/L);
%      alphap = alpha; alpha = (1+ sqrt(4*alpha*alpha +1))/2;
    if(norm(X-S,'fro')<1e-3 && iter>10),break;end
    XXp=X-Xp;
%     his(iter) = h_fobj(X);
end

% plot(his)
% ddd
Y_val = Y(X);

function [X,Y_val] = ComputeSubProb(X,A,prog_mu,rho,normA,r)
% min_{X,Y} trace(X'AX) + mu*norm(Y,1) + rho (0.5 r-<X,Y>+0.5||Y||_F^2)
% Y = argmin_{Y} mu*norm(Y,1) + rho (0.5||Y-X||_F^2)
% Y = argmin_{Y} mu/rho*norm(Y,1) + 0.5||Y-X||_F^2

Y = @(X)prox_l1(X,prog_mu/rho);

% update X
% min_{X} trace(X'AX) + rho (r-2<X,Y(X)> + 2||X-Xt||_F^2)
L = 2*normA;% + 4*rho;
% mu = 2*rho;

h_fobj = @(X)mdot(X,A*X) + rho*(0.5*r-mdot(X,Y(X)));% + 2*rho*norm(X-Xt,'fro')^2;
h_grad = @(X)2*A*X - rho*Y(X) ;% + 4*rho*(X-XXXX);

% assign xp with x, and Axp with Ax
Xp = X;  XXp=0*Xp;
alphap=0; alpha=1;

% his = [];
% for iter = 1:200
%     X_old = X;
%     [X] = AppOrthProj(X-h_grad(X)/L);
%     dist = norm(X-X_old,'fro');
%     if(dist<1e-3 && iter>10),break;end
% end

% X1 = AppOrthProj(randn(size(X)));
% X2 = AppOrthProj(randn(size(X)));
% norm(h_grad(X1) - h_grad(X2),'fro') / norm(X1-X2,'fro')
% L
% ddd

his = [];
for iter=1:300
    S = X + (alphap-1)/alpha*XXp;
    Xp = X;
    X = AppOrthProj(S-h_grad(S)/L);
    alphap = alpha; alpha = (1+ sqrt(4*alpha*alpha +1))/2;
    if(norm(X-S,'fro')<1e-3 && iter>10),break;end
    XXp=X-Xp;
%     his(iter) = h_fobj(X);
end

% plot(his)
% ddd
Y_val = Y(X);

function [X,Y_val] = ComputeSubProb11(Xt,A,prog_mu,rho,normA,r)
% min_{X} trace(X'AX) + <X,B> + rho*||X||_F^2

Y = @(X)prox_l1(X,0.5*prog_mu/(rho));


% update X
% min_{X} trace(X'AX) + rho (r-2<X,Y(X)> + 2||X-Xt||_F^2)
L = 2*normA + 4*rho;
mu = 2*rho;

h_grad = @(X)2*A*X -2*rho*Y(X) - 2*rho*(X-Xt);
h_fobj = @(X)mdot(X,A*X) + rho*(r-2*mdot(X,Y(X)) + 2*norm(X-Xt,'fro')^2);
% [X] = AppOrthProj(X-grad/L);


X = AppOrthProj(Xt-h_grad(Xt)/L);
X1 = X;
alpha = sqrt(mu/L);
his = [];
for iter = 1:200

    fobj = h_fobj(X1);
    his = [his;fobj];
    X_old = X;
    [X] = AppOrthProj(X1-h_grad(X1)/L);
%     X1 = X + (1-alpha)/(1+alpha)*(X-X_old);
    X1 = X ;
    
    diff = X-X_old;
    dist = norm(diff,'fro');
%     if(dist<1e-12 && iter>=10),break;end
end
  plot(his)
 


ddddd
Y_val = Y(X);
