{
  "name": "Changing Delayed Crossing | E2E | Best",

  "project": "discrete_mbrl-mf_chainging_best",

  "command": "python model_free/train.py",

  "algorithm": "grid",

  "spec": {
    "metric": "reward",
    "objective": "maximize",
    "retryAssignLimit": 4
  },

  "trials": 30,

  "parameters": {
    "comet_ml": true,
    "ae_recon_loss": false,
    "ae_er_train": false,
    "e2e_loss": true,
    "device": "cuda",
    "log_freq": 2500,
    "learning_rate": 0.0003,
    "batch_size": 256,
    "mf_steps": 600000,
    "embedding_dim": 64,
    "env_change_freq": 40000,
    "env_max_steps": 400,
    "n_ae_updates": 8,
    "ppo_batch_size": 64,
    "ppo_value_coef": 0.5,
    "ppo_iters": 10,
    "ppo_clip": 0.2,
    "rl_start_step": 0,
    "env_change_type": "random",

    "ae_model_type": "ae",
    "latent_dim": 256,

    "env_name": "minigrid-crossing-stochastic-rand",
    "stochastic": "categorical"
  }
}