# Architecture description for the "cell" network: a list of `cnn` rows
# followed by an `mlp` list.
# NOTE(review): the row layout is not defined in this file. Each `cnn` row
# has five integers, and the first value of every row after the first equals
# the second value of the row before it, so the layout is presumably
# [in_channels, out_channels, kernel_size, stride, padding] — confirm against
# the code that builds the network.
# NOTE(review): -1 in the first position of `cnn` and `mlp` looks like a
# placeholder for an input size filled in by the consumer — TODO confirm.
cell_net_arch:
  cnn:
  - [-1, 32, 3, 1, 1]
  - [32, 64, 3, 2, 1]
  - [64, 64, 3, 2, 1]
  # Presumably [input_size, hidden widths...] — verify against the consumer.
  mlp: [-1, 128, 128]
# The `!!python/tuple` tag makes PyYAML construct a Python tuple instead of a
# list. It is a PyYAML-specific tag: `yaml.safe_load` rejects it, so this file
# needs a loader that supports Python tags. Do not replace it with a plain
# list unless the consumer is known to accept a list here.
# NOTE(review): the meaning of the three dimensions is not stated in this
# file — confirm against the code that reads `cell_shape`.
cell_shape: !!python/tuple [8, 11, 8]
# Extra environment options; presumably passed to the environment wrapper.
# NOTE(review): `max_room_step` and `mr_stype` are not explained in this
# file — confirm their meaning and units against the wrapper.
env_config: {max_room_step: 3000, mr_stype: 1}
# Environment identifier and family. The name looks like a Gym/ALE Atari id
# (Montezuma's Revenge, "NoFrameskip" variant) — verify against the env
# factory that consumes it.
env_name: MontezumaRevengeNoFrameskip-v4
env_type: Atari
# Presumably the weight of the extrinsic-reward advantage and the discount
# factor for extrinsic returns; compare `int_adv_coeff` / `int_gamma` —
# TODO confirm.
ext_adv_coeff: 1
ext_gamma: 0.99
# Presumably the width of an additional hidden layer — confirm which network
# uses it.
extra_hidden_size: 512
# Architecture description for the "feature" network: a list of `cnn` rows
# followed by an `mlp` list.
# NOTE(review): the row layout is not defined in this file. Each `cnn` row
# has five integers, and the first value of every row after the first equals
# the second value of the row before it, so the layout is presumably
# [in_channels, out_channels, kernel_size, stride, padding] — confirm against
# the code that builds the network.
# NOTE(review): -1 in the first position of `cnn` and `mlp` looks like a
# placeholder for an input size filled in by the consumer — TODO confirm.
feature_net_arch:
  cnn:
  - [-1, 32, 8, 4, 0]
  - [32, 64, 4, 2, 0]
  - [64, 64, 3, 1, 0]
  # Presumably [input_size, hidden widths...] — verify against the consumer.
  mlp: [-1, 512, 512]
# Presumably the weight of the intrinsic-reward advantage and the discount
# factor for intrinsic returns; compare `ext_adv_coeff` / `ext_gamma` —
# TODO confirm.
int_adv_coeff: 6
int_gamma: 0.99
# Learning rate; presumably handed to the optimizer — confirm which one.
lr: 0.00025
# Presumably a per-episode cap counted in emulator frames — confirm the unit
# (frames vs. agent steps) against the environment wrapper.
max_frames_per_episode: 18000
# Size of the discrete action space; presumably must match the environment
# named by `env_name` — verify.
n_actions: 18
# Rollout/batching settings. NOTE(review): presumably each rollout collects
# n_workers * rollout_length transitions, split into n_mini_batch parts per
# update — confirm against the training loop.
n_mini_batch: 16
n_workers: 128
# NOTE(review): `obs_is_color` is true while `obs_shape` has a leading
# dimension of 1. If that dimension is the channel count, the two settings
# look inconsistent — confirm how the consumer interprets them.
obs_is_color: true
# `!!python/tuple` makes PyYAML construct a Python tuple instead of a list.
# `yaml.safe_load` rejects this tag, so the file needs a loader that supports
# Python-specific tags. Presumably (channels, height, width) — TODO confirm.
obs_shape: !!python/tuple [1, 84, 84]
# Presumably the hidden width of the RND (random network distillation)
# networks — confirm.
rnd_hidden_size: 128
# Presumably the number of steps each worker collects per rollout — confirm.
rollout_length: 512
# NOTE(review): the `sla_*` settings are not explained in this file, and the
# meaning of "sla" cannot be determined from here. Confirm each one against
# the code that reads it before changing any value.
sla_reward: 0.01
sla_reward_clip: 3
sla_shortest_coeff: 1000
sla_value_model_type: 0
# Python tuple (same `!!python/tuple` loader requirement as `obs_shape`).
# Presumably 4 stacked 84x84 frames — TODO confirm.
state_shape: !!python/tuple [4, 84, 84]
# Presumably the total number of rollouts collected per environment over the
# whole training run — confirm.
total_rollouts_per_env: 25000
