{
  "name": "Delayed RL Door Key | FTA AE | Sweep",

  "project": "model-free-minigrid",

  "command": "python model_free/train.py",

  "algorithm": "grid",

  "spec": {
    "metric": "reward",
    "objective": "maximize",
    "retryAssignLimit": 4
  },

  "trials": 3,

  "parameters": {
    "comet_ml": true,
    "ae_recon_loss": true,
    "ae_er_train": true,
    "device": "cuda",
    "log_freq": 10000,
    "learning_rate": 0.0003,
    "batch_size": 256,
    "mf_steps": 2500000,
    "embedding_dim": 64,
    "env_max_steps": 1000,
    "n_ae_updates": 8,
    "ppo_batch_size": 64,
    "ppo_value_coef": 0.5,
    "ppo_iters": 10,
    "ppo_clip": 0.2,
    "rl_start_step": 500000,

    "ae_model_type": "fta_ae",

    "env_name": "minigrid-door-key-stochastic",
    "stochastic": "categorical",

    
    "latent_dim": {
      "type": "discrete",
      "values": [16, 64, 256, 1024]
    },
    "fta_tiles": {
      "type": "discrete",
      "values": [8, 16, 32, 64]
    },
    "fta_eta": {
      "type": "discrete",
      "values": [0.125, 0.25, 0.5]
    }
  }
}