
reset;                # Title: Product Usage under Aging Effects: Learning and Earning using Markov Chains

option randseed'';    # estimation good if either T or N are not large 
                      # estimation bad if N large and data contains only long step observations (skewed)

param T default 50;   # number of states
param N default 15+1; # number of nodes in the chain (max 500 bei T=20)
param A default 5;    # number of usage actions
param K := T-1;       # number of probs to estimate in main bandmatrix
param R := 1;        # number of sim runs

param gap default 0.0;   # parameter G
param KKK default 1000;  # number of data observations

param Ny{n in 1..N-1} := if n>gap*(N-1) then KKK/(N-1-gap*(N-1));  # number of n-step training observations 

param KK:= sum{n in 1..N-1} Ny[n];  

param fs {i in 1..T,j in 1..T,a in 1..A} := if i=j<T then 1-0.5*(a+i)/(A+T)/(N-1)^0.5    
                                                         else if i=j-1 then 1-fs[i,i,a]     # main transition probabilities to be found
							 else if i=j=T then 1 else 0;       
							 
param pp_true{i in 1..T,a in 1..A} := fs[i,i,a];

param Pn{i in 1..T,j in 1..T,n in 1..N-1,a in 1..A} := if n=1 then fs[i,j,a]  # n steps forward true transition matrix
                                 else sum{k in 1..T} Pn[i,k,n-1,a]*fs[k,j,a];


param x {n in 1..N-1,i in 1..Ny[n],k in 1..2} default if k=1 then round(Uniform(0.5,T-0.5))  # state feature data 1-step
                                                        else round(Uniform(0.5,A+0.5)); # used (average) action

param p_true {i in 1..K,j in 1..T,n in 1..N-1,a in 1..A} := Pn[i,j,n,a];   # unknown true impact 3-step of P3 needed for sim

param z{n in 1..N-1,i in 1..Ny[n]} default Uniform(0,1);
param y{n in 1..N-1,i in 1..Ny[n]} default if x[n,i,1]=T then T 
                                      else min{ii in 1..T:sum{j in 1..ii} p_true[x[n,i,1],j,n,x[n,i,2]] > z[n,i]} ii;
				  	  			  			  
###########    structure of n-step transition Matrices Pn as function of p_k

var b {k in 1..K,a in 1..A} <=500, := Uniform(0,1);			    # beta coefficients (for logit probs)
var p {k in 1..K,a in 1..A} = exp(b[k,a])/(1+exp(b[k,a]));      # probs for main bandmatrix

#################    Diagonalisierung     #####################

var zv{i in 1..K,j in i..K  ,a in 1..A} = prod{k in i..j}  (p[k,a]-1);       # lambda
var nv{i in 1..K,j in i+1..K,a in 1..A} = prod{k in i+1..j}(p[i,a]-p[k,a]);  # theta
var nu{i in 2..K,j in 1..i-1,a in 1..A} = prod{k in j..i-1}(p[i,a]-p[k,a]);  # kappa
                                         
var U {i in 1..T,j in 1..T,a in 1..A}   = if j=1   then 1                                    
                           				 else if j=i+1 then 1
  				                         else if i>=j  then 0
							 else               zv[i,j-2,a]/(if nu[j-1,i,a]=0 then 10^-9 else nu[j-1,i,a]) * (-1)^(i+j-1);      # rest rechts oben
					
var Dn{i in 1..T,j in 1..T,n in 1..N-1,a in 1..A}   = if i=j=1 then 1 else if i=j then p[i-1,a]^n else 0;

var V {i in 1..T,j in 1..T,a in 1..A}   = if i=1   then (if j=T then 1 else 0)   
                            				 else if i=j+1 then 1						 
							 else if i>j   then 0
							 else if i=j=T then -1
							 else if j=T   then zv[i,K,a]    /(if nv[i-1,K,a]=0 then 10^-9 else nv[i-1,K,a]) * (-1)^(i+j-1)     # letzte Spalte
							 else               zv[i-1,j-1,a]/(if nv[i-1,j,a]=0 then 10^-9 else nv[i-1,j,a]) * (-1)^(i+j-1);    # rest rechts oben


#var Pnn{i in 1..T,j in i..T,n in 1..N-1,a in 1..A} = sum{k in 1..T} U[i,k,a]*(if k=1 then 1 else p[k-1,a]^n)*V[k,j,a];


###########    logit optimality conditions    ###########

maximize LL: 1/T/KK*sum{n in 1..N-1} sum{i in 1..Ny[n]}
#                     ( log(  max(Pnn[x[n,i,1],y[n,i],n,x[n,i,2]],0) + 10^-19) );	 
                      ( log(  max(sum{k in 1..T} U[x[n,i,1],k,x[n,i,2]]*(if k=1 then 1 else p[k-1,x[n,i,2]]^n)*V[k,y[n,i],x[n,i,2]],0) + 10^-19) );	 
					 

option solver minos; solve; 


display p,pp_true;

display _solve_elapsed_time;
display _ampl_time;

param time default 0; let time:= _ampl_time;
#end;

##########  EM Solution  #########

param pem{i in 1..T-1,a in 1..A} default 0.15;   #for {i in 1..T-1,a in 1..A} let pem[i,a] := p[i,a];

param fsem {i in 1..T,j in 1..T,a in 1..A} default 1/T;  #if i=j<T then pem[i,a] else if i=j-1 then 1-pem[i,a] else if i=j=T then 1 else 0;       

param Pnem{i in 1..T,j in 1..T,n in 1..N-1,a in 1..A} default 1/T; # if n=1 then fsem[i,j,a] else sum{k in 1..T} Pnem[i,k,n-1,a]*fsem[k,j,a];

param EN0{i in 1..T-1,a in 1..A} default 0.5;
param EN1{i in 1..T-1,a in 1..A} default 0.5;

param test {i in 1..T-1,a in 1..A} default 10; #pem[i,a] - EN0[i,a]/(EN0[i,a]+EN1[i,a]);


#######

for {jj in 1..600} {
#display pem, test, EN0, EN1;

for {i in 1..T,j in 1..T,a in 1..A} let fsem[i,j,a] := if i=j<T then pem[i,a] else if i=j-1 then 1-pem[i,a] else if i=j=T then 1 else 0;  

for {i in 1..T,j in 1..T,n in 1..N-1,a in 1..A} let Pnem[i,j,n,a] := if n=1 then fsem[i,j,a] else sum{k in 1..T} Pnem[i,k,n-1,a]*fsem[k,j,a];

for {i in 1..T-1,a in 1..A} let EN0[i,a]:= sum{n in 1..N-1,k in 1..Ny[n]:x[n,k,2]=a}    pem[i,x[n,k,2]]  / max(Pnem[x[n,k,1],y[n,k],n,x[n,k,2]],10^-19) *
                                           sum{t in 0..n-1} (if t=0 then (if x[n,k,1]=i then 1) else Pnem[x[n,k,1],i,t,x[n,k,2]]) * (if n-t-1=0 then (if y[n,k]=i   then 1) else Pnem[i,y[n,k],n-t-1,x[n,k,2]]);;

for {i in 1..T-1,a in 1..A} let EN1[i,a]:= sum{n in 1..N-1,k in 1..Ny[n]:x[n,k,2]=a} (1-pem[i,x[n,k,2]]) / max(Pnem[x[n,k,1],y[n,k],n,x[n,k,2]],10^-19) *
                                           sum{t in 0..n-1} (if t=0 then (if x[n,k,1]=i then 1) else Pnem[x[n,k,1],i,t,x[n,k,2]]) * (if n-t-1=0 then (if y[n,k]=i+1 then 1) else Pnem[i+1,y[n,k],n-t-1,x[n,k,2]]);;

for {i in 1..T-1,a in 1..A} let test[i,a] := abs(pem[i,a] - EN0[i,a]/max(10^-10,EN0[i,a]+EN1[i,a]));;

if max{i in 1..T-1} test[i,1] <0.0001 then {display jj; display test; break;};

for {i in 1..T-1,a in 1..A} let pem[i,a] := EN0[i,a]/max(10^-6,EN0[i,a]+EN1[i,a]);;
                     };


display p,pp_true,pem;

display time, _ampl_time-time;

display _solve_elapsed_time;

end;










var EN0{i in 1..T-1,a in 1..A} = sum{n in 1..N-1,k in 1..Ny[n]}    p[i,a]  / max(Pnn[x[n,k,1],y[n,k],n,a],10^-19) *   # korrekt aber lokale Lösung oft schlecht
                                 sum{t in 0..n-1} (if t=0 then 1 else Pnn[x[n,k,1],i,t,a]) * (if n-t-1=0 then 1 else Pnn[i,y[n,k],n-t-1,a]);


var test {i in 1..T-1,a in 1..A} = p[i,a] - EN0[i,a]/(EN0[i,a]+EN1[i,a]);



display mape,mae,LL,KK,gap;
display p,pp_true;
display _solve_elapsed_time;

param pem  {i in 1..T-1,a in 1..A} default 0;

for {jj in 1..10000} {
display p, test,EN0, EN1;
if sum{i in 1..T-1} abs(test[i,1]) <0.0001 then {display jj; display test; break;};
for {i in 1..T-1,a in 1..A} let pem[i,a]:=EN0[i,a]/(EN0[i,a]+EN1[i,a]);
for {i in 1..T-1,a in 1..A} let p[i,a]:=pem[i,a];
                  };

display mape,mae,LL,KK,gap;
display p,pp_true;
display _solve_elapsed_time;

objective LL;
subject to nb2 {i in 1..T-1,a in 1..A}: p[i,a] = exp(b[i,a])/(1+exp(b[i,a]));

solve;

display mape,mae,LL,KK,gap;
display p,pp_true;
display _solve_elapsed_time;

display zfk2;

end;




for{kkk in 1..R} {
	option randseed 0;
	display kkk;
	for{n in 1..N-1,i in 1..Ny[n],k in 1..2} let x[n,i,k] := if k=1 then round(Uniform(0.5,T-0.5))  # state feature data 1-step
                                                        else round(Uniform(0.5,A+0.5)); # used (average) action
	for{n in 1..N-1,i in 1..Ny[n]} let z[n,i] := Uniform(0,1);
    for{n in 1..N-1,i in 1..Ny[n]} let y[n,i] := if x[n,i,1]=T then T 
                                      else min{ii in 1..T:sum{j in 1..ii} p_true[x[n,i,1],j,n,x[n,i,2]] > z[n,i]} ii;
	for {k in 1..K,a in 1..A} let b[k,a] := Uniform(0,1);
	solve;
	display mape,mae,LL,KK,gap; display _solve_elapsed_time;
	let results[kkk,1]:=mape;
	let results[kkk,2]:=mae;
	let results[kkk,3]:=_solve_elapsed_time;
                 };

	display muresults;
	display s2results;	
	printf"%3i %6.3f %6.3f %6.3f %6.3f %6.2f %6.3f\n", T, 
	muresults[1], s2results[1], muresults[2], s2results[2], muresults[3], s2results[3]  >> aging_observable_T_out.txt;

	display p,pp_true;					   
end;










