{
  "name": "Delayed RL Door Key | VQVAE | Best",

  "project": "model-free-minigrid",

  "command": "python model_free/train.py",

  "algorithm": "grid",

  "spec": {
    "metric": "reward",
    "objective": "maximize",
    "retryAssignLimit": 4
  },

  "trials": 30,

  "parameters": {
    "comet_ml": True,
    "ae_recon_loss": True,
    "ae_er_train": True,
    "device": "cuda",
    "log_freq": 10000,
    "learning_rate": 0.0003,
    "batch_size": 256,
    "mf_steps": 4000000,
    "embedding_dim": 64,
    "env_max_steps": 1000,
    "n_ae_updates": 8,
    "ppo_batch_size": 64,
    "ppo_value_coef": 0.5,
    "ppo_iters": 10,
    "ppo_clip": 0.2,
    "rl_start_step": 500000,

    "ae_model_type": "vqvae",
    "filter_size": 6,
    "codebook_size": 256,

    "env_name": "minigrid-door-key-stochastic",
    "stochastic": "categorical"
  }
}