# Copyright (c) 2021, NVIDIA CORPORATION.  All rights reserved.
#
# NVIDIA CORPORATION and its licensors retain all intellectual property
# and proprietary rights in and to this software, related documentation
# and any modifications thereto.  Any use, reproduction, disclosure or
# distribution of this software and related documentation without an express
# license agreement from NVIDIA CORPORATION is strictly prohibited.
# Agent definition: `cls` is the dotted path of the agent class and `params`
# holds the arguments meant for it (presumably passed to its constructor by
# the training script -- confirm against the code that consumes this config).
agent:
  name: td3
  cls: agent.td3.TD3Agent
  params:
    # `???` is OmegaConf's mandatory-value marker: these entries are not set
    # in this file and must be supplied before they are read (presumably
    # filled in from the environment at startup -- TODO confirm).
    obs_dim: ???
    action_dim: ???
    action_range: ???
    goal_dim: ???
    # Interpolates the top-level `device` key of this file.
    device: ${device}
    discount: 0.99
    critic_tau: 0.005
    batch_size: 256
    # NOTE(review): a learnable temperature is usually a SAC concept; confirm
    # that TD3Agent actually accepts and uses this parameter.
    learnable_temperature: true

# Environment
env: reacher_easy
goal_mode: single_goal

# Experiment label; set it manually for each run. Together with `env` and
# `goal_mode` it is interpolated into the Hydra run directory name.
experiment: vanilla

# Total number of training steps. Written as a plain integer on purpose: the
# exponent form `1e7` has no decimal point, so YAML 1.1 loaders such as PyYAML
# read it as the string "1e7", while other loaders read it as a float.
num_train_steps: 10000000
# Replay buffer capacity tracks the training length via interpolation.
replay_buffer_capacity: ${num_train_steps}

# NOTE(review): presumably the number of initial steps collected before the
# learned policy is used -- confirm against the training loop.
num_seed_steps: 500

# NOTE(review): the unit of eval_frequency (steps vs. episodes) is not visible
# in this file -- confirm against the training loop.
eval_frequency: 30
num_eval_episodes: 10

# Also consumed by agent.params.device through the `${device}` interpolation.
device: cuda

# logger
log_frequency: 10000
# NOTE(review): presumably enables TensorBoard output -- confirm.
log_save_tb: true
# NOTE(review): the unit of ckpt_frequency is not visible in this file; note
# that it differs by orders of magnitude from log_frequency -- confirm.
ckpt_frequency: 50

# NOTE(review): presumably resumes from previously saved weights when they
# exist -- confirm against the training script.
# Spelled as canonical lowercase `true`, like the other booleans in this file.
reload_weights: true

# video recorder
save_video: true

# Random seed for the run.
seed: 1

# hydra configuration
hydra:
  run:
    # One output directory per run:
    #   ./runs/<date>/<env>_<goal_mode>_<experiment>_<overrides>
    # where <date> comes from the `now` resolver and <overrides> from
    # `hydra.job.override_dirname`.
    dir: ./runs/${now:%Y.%m.%d}/${env}_${goal_mode}_${experiment}_${hydra.job.override_dirname}
