# Flat hyperparameter mapping. Frame counts quoted in the comments use the
# 4 frames-per-step ratio implied by "50M steps = 200M frames" below.
# Values written after "alternative value:" are the commented-out numbers kept
# from the original file -- NOTE(review): presumably the full-scale settings;
# confirm before restoring them.
num_steps: 50000000  # Equivalent to 200M frames.
batch_size: 32
N: 64
N_dash: 64
K: 32
num_cosines: 64
kappa: 1.0
lr: 5.e-5
memory_size: 1000000
gamma: 0.99
multi_step: 1
update_interval: 1  # alternative value: 4
target_update_interval: 1000  # alternative value: 10000
start_steps: 2500  # alternative value: 50000
epsilon_train: 0.01
epsilon_eval: 0.001
epsilon_decay_steps: 250000  # Equivalent to 1M frames.
double_q_learning: False
dueling_net: False
noisy_net: False
alea_comparison_measure: "wang"
# "!!python/tuple" is a PyYAML-specific tag: the value loads as a Python tuple,
# and yaml.safe_load rejects it, so this file needs a loader that permits
# Python tags.
alea_comparison_hyps: !!python/tuple [0.0]
epi_comparison_measure: "oneversusall"
# Same PyYAML-specific tuple tag as alea_comparison_hyps; not safe-loadable.
epi_comparison_hyps: !!python/tuple [0., 2]
epistemic_method: "ensemble"
num_ensembles: 50
use_per: False
log_interval: 1
eval_interval: 250000
# The "500k frames" figure belongs to the alternative value 125000; the active
# value of 1250 steps corresponds to 5k frames at 4 frames per step.
num_eval_steps: 1250  # alternative value: 125000 (equivalent to 500k frames)
max_episode_steps: 27000
# NOTE(review): the key is spelled "grad_cliping" (single "p"); presumably the
# consumer looks up this exact spelling -- confirm before renaming.
grad_cliping: 10.
