{
  "agent_path": null,
  "environment": {
    "env_make_kwargs": {},
    "gym_id": "Pendulum-v1",
    "max_episode_steps": 5,
    "num_vec": 2,
    "parallel": false
  },
  "load_reward_kwargs": {},
  "logging": {
    "log_dir": "quickstart/rl/",
    "log_format_strs": [
      "tensorboard",
      "stdout"
    ],
    "log_format_strs_additional": {},
    "log_level": 20,
    "log_root": null,
    "wandb": {
      "wandb_additional_info": {},
      "wandb_kwargs": {
        "monitor_gym": false,
        "project": "imitation",
        "save_code": false
      },
      "wandb_name_prefix": "",
      "wandb_tag": null
    }
  },
  "normalize_kwargs": {},
  "normalize_reward": true,
  "policy": {
    "policy_cls": {
      "py/type": "imitation.policies.base.FeedForward32Policy"
    },
    "policy_kwargs": {}
  },
  "policy_evaluation": {
    "n_episodes_eval": 1
  },
  "policy_save_final": true,
  "policy_save_interval": 2,
  "reward_path": null,
  "reward_type": null,
  "rl": {
    "batch_size": 2,
    "rl_cls": {
      "py/type": "stable_baselines3.ppo.ppo.PPO"
    },
    "rl_kwargs": {
      "batch_size": 2,
      "ent_coef": 0.0,
      "gamma": 0.9,
      "learning_rate": 0.001,
      "n_epochs": 10
    }
  },
  "rollout_save_final": true,
  "rollout_save_n_episodes": null,
  "rollout_save_n_timesteps": 2000,
  "seed": 730787762,
  "total_timesteps": 4
}