% Simulate multinomial-logit (softmax) outcomes for randomly chosen feature
% vectors, fit a nominal multinomial regression with mnrfit, and compare the
% fitted slope coefficients with the generating ones.
%
% Workspace variables produced:
%   Thetaa     (K+1)-by-d generating coefficients; last row is all zeros
%   D          N-by-d candidate feature vectors
%   Action     (T-t)-by-d feature vector used in each simulated round
%   reward     (T-t)-by-1 sampled category index in 1..K+1
%   B          mnrfit estimate, (d+1)-by-K (row 1 is the intercept)
%   M          Thetaa transposed, d-by-(K+1)
%   difference d-by-K, fitted slopes minus generating slopes

t = 0;   % rounds already elapsed; the simulation covers rounds t+1..T
K = 2;   % number of non-reference categories (K+1 outcomes in total)
d = 2;   % feature dimension
N = 2;   % number of candidate feature vectors
T = 1000;

Thetaa = [(rand(K,d)-0.5)*2; zeros(1,d)];  % K+1 by d, entries uniform in [-1,1]
D = normrnd(0,1,[N,d]);

% mnrfit always adds an intercept, so each category has d+1 parameters.
% With fewer than d+1 distinct feature vectors the design matrix
% [ones, Action] is rank deficient and the estimates are not unique.
if N < d+1
    warning('simulation:notIdentifiable', ...
        ['Only N=%d distinct feature vectors for d+1=%d parameters per ', ...
         'category; mnrfit estimates are not identifiable and the ', ...
         'comparison with Thetaa is not meaningful.'], N, d+1);
end

% Preallocate so that stale workspace values cannot leak in from an earlier
% run and so that Action is not regrown on every iteration.
numRounds = max(T - t, 0);
Action = zeros(numRounds, d);
reward = zeros(numRounds, 1);

n = 1;   % one multinomial trial per round
for i = t+1:T
    row = i - t;                    % keep Action and reward aligned when t > 0
    f = randi(N);                   % pick one candidate feature vector at random
    Action(row,:) = D(f,:);
    pp = D(f,:)*Thetaa';            % 1 by K+1 linear scores
    p = exp(pp)/sum(exp(pp));       % softmax probabilities
    yy = mnrnd(n,p);                % one-hot draw because n == 1
    reward(row,1) = find(yy==1);    % index of the sampled category
end

B = mnrfit(Action,reward); %d+1 by K
M = Thetaa'; %d by K+1

% Displayed on purpose (no semicolon): generating vs. fitted slopes.
M(:,1:K)
B(2:d+1,1:K)
difference = B(2:d+1,1:K)-M(:,1:K);