clear all

% ---- Experiment constants -------------------------------------------
d      = 2;       % number of columns of D and Thetaa
T      = 1000;    % enters lambda below and is forwarded to MNLUCB
Tprime = 10;      % forwarded to MNLUCB
delta  = 0.01;    % forwarded to MNLUCB

N = 10;           % number of rows drawn for D
K = 1;            % number of randomly drawn rows of Thetaa

% ---- Derived quantities ---------------------------------------------
% (K+1)-by-1 column: the values 1..K followed by a trailing 0.
rb     = [(1:K)'; 0];
R      = norm(rb);
lambda = K * d * log(T);

% Start outside [20, 30] so the acceptance loop that follows is entered
% at least once.
kappa = 202;
% Rejection-sample a problem instance: redraw D and Thetaa until the
% kappa reported by kappaandL lies in [20, 30].
% NOTE(review): the number of redraws is unbounded; if kappaandL rarely
% lands in this window the loop can run for a long time.
while (kappa < 20 || kappa > 30)
    D = normrnd(0, 1, [N, d]);                         % N-by-d
    Thetaa = [normrnd(0, 1/K, [K, d]); zeros(1, d)];   % (K+1)-by-d, last row is zero
    S = norm(Thetaa(:));
    [kappa, L] = kappaandL(D, S, K, N);                % semicolon: do not echo on every redraw
end

% Expected reward of each row of D: softmax of D(i,:)*Thetaa' weighted by
% rb. Only the accepted draw matters, so this is computed once after the
% loop instead of for every rejected draw. Preallocated as 1-by-N.
exprew = zeros(1, N);
for i = 1:N
    pp = D(i, :) * Thetaa';          % 1-by-(K+1)
    p = exp(pp) / sum(exp(pp));      % normalise to probabilities
    exprew(i) = p * rb;
end

% Best row of D by expected reward, stored as a d-by-1 column. The index
% output of max returns the first maximiser, so xstar stays a single
% column even if several rows tie (find(exprew==max(exprew)) would
% return all of them).
[optimalexpectedreward, bestIdx] = max(exprew);
xstar = D(bestIdx, :)';

% Run MNLUCB repeatedly on the same instance; row i of RT1 holds the
% vector returned by run i.
numRuns = 20;
for i = 1:numRuns
    RT1(i,:) = MNLUCB(d,D,N,rb,Thetaa,K,T,lambda,delta,S,L,R,kappa,optimalexpectedreward,Tprime);
end

% Plot the average over all runs. The previous plot(RT1(i,:)) depended on
% the loop index surviving the loop and therefore showed only the last run.
% NOTE(review): assumes the across-run mean is the intended summary; use
% RT1(numRuns,:) to restore the last-run-only plot.
plot(mean(RT1, 1))

