function [ W_t ] = AGD_TL( x_t, y_t, x_s, W_t, lambda, eta, beta, T, L )
%AGD_TL  Gradient descent with momentum on a weighted two-term gradient.
%
%   W_t = AGD_TL(x_t, y_t, x_s, W_t, lambda, eta, beta, T, L) updates W_t
%   over L outer passes of T inner steps each and returns the result.
%
%   Inputs (roles as used in this function):
%     x_t, y_t - inputs/labels passed to Gradient_tl for the first gradient
%                term (weighted by lambda).
%     x_s      - inputs for the second gradient term (weighted by 1-lambda).
%                Its labels y_s are regenerated from the current W_t via
%                y_tl at the start of every outer pass. May be empty, in
%                which case only the first term is used (lambda forced to 1).
%     W_t      - initial parameters; the updated value is returned.
%     lambda   - mixing weight between the two gradient terms.
%     eta      - step size multiplying the combined gradient.
%     beta     - momentum coefficient multiplying the previous step
%                (W_t - W_pre).
%     T        - number of inner gradient steps per outer pass.
%     L        - number of outer passes.
%
%   NOTE(review): the shapes of x_t, y_t, x_s and W_t are dictated by the
%   helpers y_tl and Gradient_tl, which are defined elsewhere; the only
%   thing this function relies on is that x_t can be indexed as x_t(:,1).

if isempty(x_s)

    % No second data set supplied: put all weight on the first term.
    lambda = 1;

    % Placeholder so that y_tl / Gradient_tl still receive a non-empty
    % input; its gradient is multiplied by (1 - lambda) = 0 below.
    x_s = x_t(:,1);

end

for l = 1 : L

    % Labels for x_s are regenerated from the current parameters.
    y_s = y_tl( x_s , W_t );

    % Previous iterate for the momentum term. It is reset at the start of
    % every outer pass (when y_s changes), so the first inner step of each
    % pass is a plain gradient step.
    W_pre = W_t;

    for t = 1 : T

        G = lambda * Gradient_tl( y_t, x_t, W_t) + (1-lambda) * Gradient_tl( y_s, x_s, W_t);

        % Momentum update. The previous iterate must be remembered from
        % the preceding step; overwriting W_pre with W_t before this line
        % would make (W_t - W_pre) identically zero and disable momentum.
        W_next = W_t - eta * G + beta * (W_t - W_pre);

        W_pre = W_t;
        W_t = W_next;

    end

end

end

