function RT = MNLUCB(d,D,N,rb,Thetaa,K,T,lambda,delta,S,L,R,kappa,optimalexpectedreward,Tprime)


theta(:,:,1)=zeros(K+1,d);
V(:,:,1)=kappa*lambda*eye(d);
% e=@(k,n) [zeros(k-1,1);1;zeros(n-k,1)];
Action = [];



for t=1:Tprime
    f(t)=randi(N);
    x(:,t) = D(f(t),:)';
    Action = [Action;x(:,t)'];
    pp=x(:,t)'*Thetaa';
    p=exp(pp)/sum(exp(pp));
    yy(t,:)=mnrnd(1,p);    
    reward(t,1) = find(yy(t,:)==1);
    expectedreward(t,1) = p*rb;
    for j=1:K        
        V(:,:,t) = V(:,:,t)+ x(:,t)*x(:,t)';
    end
    V(:,:,t+1) = V(:,:,t);
   
end

 B = mnrfit(Action,reward);
 theta(:,:,Tprime+1) = [B(2:d+1,1:K)';zeros(1,d)];



for t=Tprime+1:T
    clear B
    betaa = ((K^(3/2))*d*log(1+(t/d/lambda))/sqrt(lambda))+(sqrt(lambda/K)/2)+((2*K^(3/2))*d*log(2/delta)/sqrt(lambda))+(S*sqrt(lambda));
    for i=1:N
        M(i,t) = sqrt(D(i,:)*inv(V(:,:,t))*D(i,:)');
        Delta(i,t) = 2*R*L*betaa*sqrt(kappa*(1+2*S))*M(i,t);
        ppi=D(i,:)*theta(:,:,t)';
        pi=exp(ppi)/sum(exp(ppi));
        upper(i,t) = pi*rb+Delta(i,t);
    end
    
  
    m(t,1) = find(upper(:,t)==max(upper(:,t)));
    x(:,t) = D(m(t,1),:)';
    Action = [Action;x(:,t)'];
    pp=x(:,t)'*Thetaa';
    p=exp(pp)/sum(exp(pp));
    yy(t,:)=mnrnd(1,p);
    
    reward(t,1) = find(yy(t,:)==1);
    expectedreward(t,1) = p*rb;
          
    V(:,:,t+1) = V(:,:,t)+ x(:,t)*x(:,t)';
    B = mnrfit(Action,reward);
    theta(:,:,t+1) = [B(2:d+1,1:K)';zeros(1,d)];
end


RR = optimalexpectedreward - expectedreward;
for ii=1:t
    RT(ii) = sum(RR(1:ii));
end