Parameter,Value
epsilon_wibql,1
C_one_wibql,0.1
Cp_wibql,0.2
replay_buffer_size_wibql,60000
num_replays_per_dream_wibql,1000
replay_period_wibql,1000000
lambda_bound_wibql,-1
learn_divisor_wibql,500
epsilon_divisor_wibql,500
epsilon_maiql,1
C_one_maiql,0.1
Cp_maiql,0.2
replay_buffer_size_maiql,60000
num_replays_per_dream_maiql,1000
replay_period_maiql,10
lambda_bound_maiql,-10000
learn_divisor_maiql,500
epsilon_divisor_maiql,500
epsilon_lpql,1
C_one_lpql,0.1
replay_buffer_size_lpql,60000
num_replays_per_dream_lpql,1000
replay_period_lpql,1000000
lambda_bound_lpql,1
learn_divisor_lpql,500
epsilon_divisor_lpql,500
epsilon_lam0,1
C_one_lam0,0.2
replay_buffer_size_lam0,60000
num_replays_per_dream_lam0,1000
replay_period_lam0,100
learn_divisor_lam0,500
epsilon_divisor_lam0,500
epsilon_maiql_aprx,1
C_one_maiql_aprx,0.4
replay_buffer_size_maiql_aprx,60000
num_replays_per_dream_maiql_aprx,1000
replay_period_maiql_aprx,100
lambda_bound_maiql_aprx,3
learn_divisor_maiql_aprx,500
epsilon_divisor_maiql_aprx,500