function Reward=UCWhittleWindow(user, channel, P, w, T, H, gamma, epsilon);
Reward=zeros(1,T);
count0=zeros(user, T);
count1=zeros(user, T);
C0=zeros(1,user);
C1=zeros(1, user);
Caction0=zeros(1,user);
den=ones(1, user);
eta=0.05;
num=2*log(2*user*T/eta);
Pest(1:user)=0.5;
for i=1:user
q(i)=min(sqrt(num/den(i)), 1);
end
for t=1:T
    AoI=zeros(1, user);
    for h=1:H
        a=zeros(1, user);
        for i=1:user
           W(i)=WhittleIndexUC(w(i), AoI(i), Pest(i),q(i));
        end
        [~, index]=maxk(W, channel);
        a(index)=1;
        for i=1:user
            if a(i)==1
                if rand<=P(i, t)
                    count1(i, t)=count1(i, t)+1;
                    AoI(i)=1;
                else
                    count0(i, t)=count0(i, t)+1;
                    AoI(i)=AoI(i)+1;
                end
            else
                AoI(i)=AoI(i)+1;
                Caction0(i)=Caction0(i)+1;
            end
        end
        for i=1:user
        Reward(t)=Reward(t)+gamma^(h-1)*AoIfunction(w(i), AoI(i));
        end
    end
    win=randi(20);
    lw=max(t-win+1, 1);
    for i=1:user
        C0(i)=sum(count0(i, lw:t));
        C1(i)=sum(count1(i, lw:t));
        Pest(i)=C1(i)/(C1(i)+C0(i));
        Pest(i)=min(Pest(i)+num/max(C1(i)+C0(i), 1), 1);
    end
    for i=1:user
     den(i)=max(Caction0(i),1);
     q(i)=min(sqrt(num/den(i)), 1);
    end
end 
