% Reset the session and build the first-episode state of the experiment:
% users are split into two equal-sized groups that differ in their signal
% variance w and in their episode-1 success probability P(:,1).
close all;
clear;   % clears workspace variables only; avoids the extra cost of 'clear all'
clc;

channel = 1;             % number of channels (M); used by the disabled experiment code below
numClasses = 2;          % number of user classes (not named 'class': that shadows the built-in)
k = 5;                   % users per class
user = numClasses * k;   % total number of users
T = 100;                 % total number of episodes

P = zeros(user, T);      % P(n,t): probability of successful transmission of user n in episode t
w = zeros(user, 1);      % w(n): variance of signal values of user n

iteration = 50;          % number of runs; only referenced by the disabled experiment code below
%for j=1:iteration       % outer loop of the disabled experiment (its 'end' is commented out too)

% Users with n <= user/2 form the first group, the remaining users the second
% group (same split as the test n > user/2 applied to every integer n).
lastOfFirstGroup = floor(user / 2);
firstGroup = 1:lastOfFirstGroup;
secondGroup = (lastOfFirstGroup + 1):user;

w(firstGroup) = 0.9;
P(firstGroup, 1) = 0.1;

w(secondGroup) = 0.5;
P(secondGroup, 1) = 1;
% Fill P(:, 2:T). The first group of users (n <= user/2) shares one success
% probability that performs a random walk clipped to [0, 1]: in every episode
% it moves up by epsilon with probability 0.60 and down by epsilon otherwise.
% The second group (n > user/2) always has success probability 1.
epsilon = 0.5;   % step size of the walk; also referenced by the disabled experiment code below
errorp = 0.1;    % current value of the walk before the first step

% The group split does not depend on the episode, so compute it once.
lastWalkingRow = floor(user / 2);
walkingRows = 1:lastWalkingRow;
fixedRows = (lastWalkingRow + 1):user;

for t = 2:T
    % Exactly one random draw per episode decides the direction of the step.
    if rand < 0.60
        errorp = min(errorp + epsilon, 1);
    else
        errorp = max(errorp - epsilon, 0);
    end
    P(walkingRows, t) = errorp;
    P(fixedRows, t) = 1;
end

% Plot the success probability of user 1 across all T episodes.
episodeAxis = 1:T;
firstUserSuccess = P(1, :);
plot(episodeAxis, firstUserSuccess);
xlabel('Episode');
ylabel('Success Probability');


% H=50; % time horizon
% gamma=0.99; % discount factor 
% k=1;
% 
% RWhittle(j, 1:T)=WhittleOracle(user, channel, P, w, T, H, gamma, epsilon);
% %R(j,1:T)=OurPolicy(user, channel, P, w, T, H, gamma, epsilon, win);
% R1(j,1:T)=OurPolicy1(user, channel, P, w, T, H, gamma);
% RUC(j,1:T)=UCWhittle(user, channel, P, w, T, H, gamma, epsilon);
% RUC1(j,1:T)=UCWhittleWindow(user, channel, P, w, T, H, gamma, epsilon);
% Runi(j,1:T)=Uniform(user, channel, P, w, T, H, gamma, epsilon);
% RWIQL(j,1:T)=WIQL(user, channel, P, w, T, H, gamma, epsilon);
% RWIQL1(j,1:T)=WIQLWindow(user, channel, P, w, T, H, gamma, epsilon);
% end
% %R=abs(RWhittle-R);
% R1=abs(RWhittle-R1);
% RUC=abs(RWhittle-RUC);
% RUC1=abs(RWhittle-RUC1);
% Runi=abs(RWhittle-Runi);
% RWIQL=abs(RWhittle-RWIQL);
% RWIQL1=abs(RWhittle-RWIQL1);
% episode=[1, 5:5:50];
% for e=1:length(episode)
%     i=episode(e);
% %Regretiter=zeros(1, iteration);
% Regret1iter=zeros(1, iteration);
% RegretUCiter=zeros(1, iteration);
% RegretUC1iter=zeros(1, iteration);
% Regretuniiter=zeros(1, iteration);
% RegretWIQLiter=zeros(1, iteration);
% for j=1:iteration
%     %Regretiter(j)=sum(R(j,1:i));
%     Regret1iter(j)=sum(R1(j,1:i));
%     RegretUCiter(j)=sum(RUC(j,1:i));
%     RegretUC1iter(j)=sum(RUC1(j,1:i));
%     Regretuniiter(j)=sum(Runi(j,1:i));
%     RegretWIQLiter(j)=sum(RWIQL(j,1:i));
%     RegretWIQL1iter(j)=sum(RWIQL1(j,1:i));
% end
% %Regret(i)=mean(Regretiter);
% %Regretconfidence(i)=1.96*std(Regretiter)/sqrt(iteration);
% Regret1(e)=mean(Regret1iter);
% Regret1confidence(e)=1.96*std(Regret1iter)/sqrt(iteration);
% RegretUC(e)=mean(RegretUCiter);
% RegretconfidenceUC(e)=1.96*std(RegretUCiter)/sqrt(iteration);
% RegretUC1(e)=mean(RegretUC1iter);
% RegretconfidenceUC1(e)=1.96*std(RegretUC1iter)/sqrt(iteration);
% RegretWIQL(e)=mean(RegretWIQLiter);
% RegretconfidenceWIQL(e)=1.96*std(RegretWIQLiter)/sqrt(iteration);
% RegretWIQL1(e)=mean(RegretWIQL1iter);
% RegretconfidenceWIQL1(e)=1.96*std(RegretWIQL1iter)/sqrt(iteration);
% Regretuni(e)=mean(Regretuniiter);
% Regretconfidenceuni(e)=1.96*std(Regretuniiter)/sqrt(iteration);
% end
% % figure(1)
% % semilogy(1:T, Regretuni, 'b-.',1:T, RegretUC,'r--',1:T, RegretWIQL,  'm--',1:T, RegretWIQL,  'mx-', 1:T,RegretUC1,'rx-', 1:T, Regret,'k-', 1:T,  Regret1, 'kd-');
% % xlabel('Episode'), ylabel('Reg(T)') 
% % legend('Random', 'UCWhittle','WIQL', 'WIQLWindow','UCWhittleWindow','OurPolicy', 'OurPolicy1')
% % 
% figure(1)
% semilogy(episode, Regretuni, 'b-.',episode, RegretUC,'rx-',episode, RegretWIQL,  'ms--', episode,RegretUC1,'ro-', episode,  Regret1, 'k-');
% xlabel('Episode'), ylabel('Reg(T)') 
% legend('Random', 'UCWhittle','WIQL','UCWhittleWindow', 'OurPolicy1')
% 
% 
% 
% 
% 
% 
% 
%     
