{
  "name": "Delayed RL Door Key | Softmax AE | Sweep",

  "project": "model-free-minigrid",

  "command": "python model_free/train.py",

  "algorithm": "grid",

  "spec": {
    "metric": "reward",
    "objective": "maximize",
    "retryAssignLimit": 4
  },

  "trials": 3,

  "parameters": {
    "comet_ml": True,
    "ae_recon_loss": True,
    "ae_er_train": True,
    "device": "cuda",
    "log_freq": 10000,
    "learning_rate": 0.0003,
    "batch_size": 256,
    "mf_steps": 2500000,
    "embedding_dim": 64,
    "env_max_steps": 1000,
    "n_ae_updates": 8,
    "ppo_batch_size": 64,
    "ppo_value_coef": 0.5,
    "ppo_iters": 10,
    "ppo_clip": 0.2,
    "rl_start_step": 500000,

    "ae_model_type": "softmax_ae",

    "env_name": "minigrid-door-key-stochastic",
    "stochastic": "categorical",

    
    "filter_size": {
      "type": "discrete",
      "values": [4, 6, 8]
    },
    "codebook_size": {
      "type": "discrete",
      "values": [32, 64, 128, 256, 512]
    }
  }
}