# @package _global_

# Top-level run settings for this experiment.
# Environment id; presumably resolved through the Gym/Gymnasium registry
# by the training script — confirm against the caller.
env_name: MountainCarContinuous-v0
# NOTE(review): presumably toggles loading a previously saved model — confirm.
load: false
# NOTE(review): presumably toggles saving the trained model — confirm.
save: false
# NOTE(review): presumably toggles reward-curve output — confirm.
reward_curves: false

# Agent selection and training settings.
# NOTE(review): the keys under model_kwargs match Stable-Baselines3 SAC
# constructor argument names; presumably they are forwarded unchanged —
# confirm against the code that consumes this config.
algorithm:
  agent_class: SAC
  # Written as a plain integer on purpose: `1e5` has no decimal point, so
  # YAML 1.1 parsers (e.g. PyYAML) load it as the string "1e5", while other
  # loaders produce a float. A step count should be an unambiguous int.
  total_timesteps: 100000
  n_eval_episodes: 5
  policy_model: MlpPolicy
  model_kwargs:
    learning_rate: 0.0003
    batch_size: 256
    # NOTE(review): if this is the SB3 soft-update (Polyak) coefficient,
    # 1.0 copies the online critic into the target network on every update.
    # SB3's SAC default is 0.005 (1.0 is the DQN default) — confirm that
    # this value is intentional.
    tau: 1.0
    gamma: 0.99
    learning_starts: 100
    buffer_size: 1000000
    train_freq: 1
    gradient_steps: 1
    # Canonical lowercase boolean, consistent with the top-level flags.
    use_sde: false
    # NOTE(review): presumably -1 means "resample noise only at rollout
    # start", as in SB3; it should have no effect while use_sde is false —
    # confirm.
    sde_sample_freq: -1