function nn = nnff2(nn, x, y, l)
%NNFF performs a feedforward pass
% nn = nnff(nn, x, y) returns an neural network structure with updated
% layer activations, error and loss (nn.a, nn.e and nn.L)

    n = nn.n;
    m = size(x, 1);

    wc = nn.W{1};
    [tc1,tc2] = size(wc);

    gamma = nn.gamma;
    
    x = [ones(m,1) x];
    nn.a{1} = x;

    %feedforward pass
    for i = 2 : n-1
        switch nn.activation_function 
            case 'sigm'
                if i == 2 
                    %{
                    www1 = nn.W{i - 1}';
                    wv = www1(1,:);
                    www1(1,:) = [];

                    ppppp = sort(www1(:),'descend');
                    [ppppp1,ppppp2] = size(ppppp);

                    tar = ppppp(floor(ppppp1*0.1),1);
                    [wwwww1,wwwww2] = size(www1);
                                            
                    for ii = 1:wwwww1
                        for jj = 1:wwwww2
                            if www1(ii,jj) < tar
                                www1(ii,jj) = 0;
                            end
                        end
                    end
                    %}

                    nn.ww1 = nn.W{i - 1}';

                    nn.a{i} = nn.a{i - 1} * nn.ww1;
                end
                if i == 3
                    nn.a{i} = zeros(m,tc1);

                    for k = 1:m
                        
                        wwww = nn.W{i - 1}(:,2:end);
                        wwwww = nn.W{i - 1}(:,1);

                        [wwww1,wwww2] = size(wwww);
                        for ii = 1:wwww1
                            for jj = 1:wwww2
                                if ii == jj
                                    wwww(ii,jj) = 0;
                                end
                            end
                        end

                        pppp = sort(abs(wwww(:)),'descend');
                        [pppp1,pppp2] = size(pppp);

                        %tar = pppp(pppp1*0.1,1);
                        tar = pppp(floor(pppp1*gamma),1);
                        %tar = 0;
                        %ww = prim(wwww);
                        
                        
                        ww = zeros(wwww1,wwww2);

                        for ii = 1:wwww1
                            for jj = 1:wwww2
                                if abs(wwww(ii,jj)) >= tar
                                    ww(ii,jj) = wwww(ii,jj);
                                end
                            end
                        end

                        ww = [wwwww,ww];
                        nn.ww = ww;
                        

                        %ww = nn.W{i - 1};
                        pp = nn.a{i - 1}(k,:);

                        [Wii, wflag] = connect_module2(abs(ww'));
                        nn.Wii = connect_value(abs(ww'), abs(Wii), wflag);

                        [Wii1,Wii2] = size(Wii);
                        Wii = Wii/(Wii1*Wii2);

                        nn.Wii = Wii;
                        nn.wflag = wflag;

                        z_G = pp(:,2:end);
                        options = optimset('TolFun',0.0001);

                        alpha = nn.weightPenaltyL1;
                        wii = nn.Wii;

                        mx = max(wflag);

                        z = zeros(1,Wii2);
                        zc = cell(mx);

                        if exist('gpuDevice', 'var')
                            gpuDevice = gpuDevice();
                        end
                        parfor mi = 1:mx
                        %for mi = 1:mx
                            %disp(mi);
                            mvec = [0];
                            mpp = [1];
                            [pp1,pp2] = size(wflag);

                            mcol = [];
                            miol = [];
                            for mj = 1:pp2
                                if mi == wflag(1,mj)
                                    mvec = [mvec,mj];
                                    mpp = [mpp,pp(1,mj+1)];
                                    mcol = [mcol;ww(mj,1)];
                                    miol = [miol,wii(mj,1)];
                                end
                            end
                            %mpp = [1,mpp];
                            mvec(:,1) = [];
                            %mpp(:,1) = [];

                            [mc1,mc2] = size(mvec);
                            mww = zeros(mc2,mc2);
                            mwii = zeros(mc2,mc2);
                            
                            for mj = 1:mc2
                                for mk = 1:mc2
                                    mww(mj,mk) = ww(mvec(1,mj), mvec(1,mk)+1);
                                    mwii(mj,mk) = wii(mvec(1,mj)+1, mvec(1,mk));
                                end
                            end

                            mww = [mcol, mww];
                            mwii = [miol; mwii];

                            mz_G = mpp(:,2:end);
                            mz = fsolve(@(xx)root7d(xx,mpp,mww,alpha,mwii), mz_G, options);
                            
                            %for mj = 1:mc2
                            %    z(1,mvec(1,mj)) = mz(1,mj);
                            %end
                            zc{mi} = mz;
                        end

                        zc = gather(zc); 

                        for mi = 1:mx
                            mvec = [0];
                            [pp1,pp2] = size(wflag);

                            for mj = 1:pp2
                                if mi == wflag(1,mj)
                                    mvec = [mvec,mj];
                                end
                            end
                            mvec(:,1) = [];
                            [mc1,mc2] = size(mvec);

                            for mj = 1:mc2
                                mz = zc{mi};
                                z(1,mvec(1,mj)) = mz(1,mj);
                            end
                        end
                        %nn.a{i}(k,:) = sigm(z);
                        disp(k);
                        disp(i);
                        disp(l);

                        nn.a{i}(k,:) = sigm(z);

                    end

                    if i == 33
                        %nn.a{i} = nn.a{i} + nn.weightPenaltyL1 * sum(abs(nn.W{i - 1}')) + 1.0000e-08 * sum(abs(nn.W{i-1}') .* connect(nn.W{i-1}'));
                        [Wii, wflag] = connect_module2(abs(nn.W{i-1}'));
                        nn.Wii = connect_value(abs(nn.W{i-1}'), Wii, wflag);
                        nn.wflag = wflag;

                        %nn.Wii = connect_module6(abs(nn.W{i-1}'));
                        nn.a{i} = nn.a{i} + nn.alpha * sum(abs(nn.W{i-1}') .* nn.Wii) + nn.weightPenaltyL1 * sum(abs(nn.W{i-1}')) + nn.weightPenaltyL2 * sum(nn.W{i-1}' .* nn.W{i-1}');
                        %nn.a{i} = nn.a{i} + nn.weightPenaltyL1 * sum(abs(nn.W{i - 1}')) + 0 * sum(abs(nn.W{i-1}' .* nn.Wii));
                    else
                        %nn.a{i} = nn.a{i} + nn.weightPenaltyL1 * sum(abs(nn.W{i - 1}'));
                        disp('ok');
                    end
                end

            case 'tanh_opt'
                if i == 2 
                    nn.a{i} = tanh_opt(nn.a{i - 1} * nn.W{i - 1}');
                end
                if i == 3
                    nn.a{i} = zeros(m,10);
                    for k = 1:m

                        ww = nn.W{i - 1};
                        pp = nn.a{i - 1}(k,:);


                        z_G = pp(:,2:end);
                        options = optimset('TolFun',0.0001);
                        z = fsolve(@(x)root6d(x,pp,ww), z_G, options);
                        nn.a{i}(k,:) = tanh_opt(z);
                        disp(k);
                        disp(i);
                        disp(l);


                        %for jj = 1:10
                        %    ss = 0;
                        %    for kk = 1:10
                        %        ss = ss + ww(jj,kk)*tanh_opt(z(1,kk));
                        %    end 


                        %    Fij = z(1,jj)-ss-pp(1,jj);

                        %    %disp(Fij);
                        %end

                    end

                    %nn.a{i} = tanh_opt(nn.a{i - 1} * nn.W{i - 1}');
                end
        end
        
        %dropout
        if(nn.dropoutFraction > 0)
            if(nn.testing)
                nn.a{i} = nn.a{i}.*(1 - nn.dropoutFraction);
            else
                nn.dropOutMask{i} = (rand(-(nn.a{i}))>nn.dropoutFraction);
                nn.a{i} = nn.a{i}.*nn.dropOutMask{i};
            end
        end
        
        %calculate running exponential activations for use with sparsity
        if(nn.nonSparsityPenalty>0)
            nn.p{i} = 0.99 * nn.p{i} + 0.01 * mean(nn.a{i}, 1);
        end
        
        %Add the bias term
        %nn.a{i} = [ones(m,1) nn.a{i}];

        if i == 3
            nn.p{i - 1} = nn.a{i - 1};
            nn.a{i - 1} = [ones(m,1) nn.a{i}];
        end

        nn.a{i} = [ones(m,1) nn.a{i}];
    
    end
    switch nn.output 
        case 'sigm'
            %{
            www1 = nn.W{n - 1}';
            wv = www1(1,:);
            www1(1,:) = [];

            ppppp = sort(www1(:),'descend');
            [ppppp1,ppppp2] = size(ppppp);

            tar = ppppp(floor(ppppp1*0.1),1);
            [wwwww1,wwwww2] = size(www1);
                                            
            for ii = 1:wwwww1
                for jj = 1:wwwww2
                    if www1(ii,jj) < tar
                        www1(ii,jj) = 0;
                    end
                end
            end
            %}

            nn.ww2 = nn.W{n - 1}';

            nn.a{n} = sigm(nn.a{n - 1} * nn.ww2);
        case 'linear'
            nn.a{n} = nn.a{n - 1} * nn.W{n - 1}';
        case 'softmax'
            nn.a{n} = nn.a{n - 1} * nn.W{n - 1}';
            nn.a{n} = exp(bsxfun(@minus, nn.a{n}, max(nn.a{n},[],2)));
            nn.a{n} = bsxfun(@rdivide, nn.a{n}, sum(nn.a{n}, 2)); 
    end

    %error and loss
    nn.e = y - nn.a{n};
    
    switch nn.output
        case {'sigm', 'linear'}
            nn.L = 1/2 * sum(sum(nn.e .^ 2)) / m; 
        case 'softmax'
            nn.L = -sum(sum(y .* log(nn.a{n}))) / m;
    end
end
