{
  "grid" :{
    "env_name":[
      "MiniHack-DoFProHuntSparseRewards-v0"
    ],

    "num_processes": [32],
    "num_env_steps": [175000000],
    "num_steps": [256],
    "ppo_epoch": [5],
    "num_mini_batch":[1],
    "handle_timelimits":[true],

    "lr": [1e-4],
    "gamma": [0.999],
    "entropy_coef": [0.01],

    "recurrent_arch": ["lstm"],
    "recurrent_agent": [true],
    "recurrent_hidden_size": [256],

    "use_plr": [true],
    "level_replay_prob": [0.95],
    "level_replay_rho":[0.5],
    "level_replay_seed_buffer_size":[5000],
    "level_replay_temperature": [0.3],
    "level_replay_strategy": ["positive_value_loss"],
    "level_replay_score_transform": ["rank"],
    "staleness_coef":[0.3],

    "p": ["0.3,0.35,0.35"],
    "reward_dist": ["uniform"],
    "force_obl_correction":[true],
    "fully_observable": [true],
    "no_exploratory_grad_updates":[true],
    "use_learned_beliefs":[false, true],

    "log_interval":[10],
    "archive_interval": [1221],
    "screenshot_interval": [250],
    "log_dir": ["~/logs/samplr"],
    "log_action_complexity": [true],
    "test_env_names":["MiniHack-DoFProHuntSparseRewards-v0"],

    "checkpoint": [true]
  }
}