# Agent/training hyperparameters: a flat mapping of scalar values.
# NOTE(review): the meaning and units of each key are defined by the consuming
# code, which is not visible from this file; the notes below only flag
# relationships between the values themselves.

# NOTE(review): eval_interval (2500) and epsilon_decay_steps (2500) both exceed
# num_steps (2000). If all three are counted in the same step unit, evaluation
# would never trigger and the epsilon schedule would never finish within this
# budget — confirm this is intended.
num_steps: 2000

# batch_size is commented out; presumably the consumer's default applies
# — TODO confirm.
# batch_size: 32
N: 200
kappa: 1.0
# Keep the decimal point: "5.e-5" resolves to a float under YAML 1.1 loaders
# such as PyYAML, whereas "5e-5" would be loaded as a string there.
lr: 5.e-5
memory_size: 1000000
gamma: 0.99
multi_step: 1
update_interval: 4
target_update_interval: 100
start_steps: 500
epsilon_train: 0.01
epsilon_eval: 0.001  # DQN: 0.05
# Original annotation: "equals 1M frames".
# NOTE(review): that looks inconsistent with a value of 2500 — confirm or drop.
epsilon_decay_steps: 2500
# Feature switches, written as canonical lowercase booleans so they resolve to
# real booleans under every YAML schema.
double_q_learning: false
dueling_net: false
noisy_net: false
use_per: false
log_interval: 50
eval_interval: 2500
num_eval_steps: 50
max_episode_steps: 50

