# Top-level run settings (all plain scalars).
# NOTE(review): per-key meanings are inferred from the key names only;
# confirm against the code that loads this file.

# Environment identifier string.
envid: MiniHack-Room-Dark-Dense-10x10-v0
target_return: 1
num_envs: 1
norm_obs: false

# Recording options (recording is switched off here).
record: false
record_freq: 1000000
record_length: 2000

reward_scale: 1

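# The start/goal positions listed further down were randomly selected.
# Nominal split: 80 for training, 20 for testing.
# NOTE(review): this file lists only 1 training goal and 20 eval goals;
# confirm whether the 80/20 figure applies to this config.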
# Extra environment options.
# NOTE(review): presumably forwarded as keyword arguments when the
# environment is created; confirm against the loader.
env_kwargs:
  random: false
  # Observation entries to request; only the tty cursor is listed.
  observation_keys:
    - tty_cursor

# Training start positions: a list of two-integer pairs (one entry here).
train_start_pos:
  - [0, 0]

# Training goal positions: same list-of-pairs layout (one entry here).
train_goal_pos:
  - [2, 0]

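# train tasks for sfixed, grand
# NOTE(review): the keys below are eval_*; confirm whether this heading
# should read "eval tasks".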
# Evaluation start position: a single two-integer pair (unlike
# train_start_pos, which is a list of pairs).
eval_start_pos: [0, 0]

# Evaluation goal positions: 20 two-integer pairs.
eval_goal_pos:
  - [9, 0]
  - [8, 4]
  - [3, 4]
  - [6, 5]
  - [7, 5]
  - [5, 0]
  - [3, 5]
  - [9, 8]
  - [8, 7]
  - [3, 0]
  - [6, 6]
  - [5, 9]
  - [1, 7]
  - [5, 1]
  - [1, 6]
  - [5, 8]
  - [2, 1]
  - [4, 9]
  - [6, 4]
  - [6, 8]
