# Hydra defaults list. `_self_` marks the position at which this file's own
# values are merged in the composition order.
defaults:
  - _self_

# Run identification. Both exp_name and seed are interpolated into
# hydra.run.dir further down in this file.
exp_name: default
seed: 0
# Relative paths; presumably the log and checkpoint output directories —
# confirm against the code that reads them.
log_path: ./logs
save_path: ./checkpoints

# NOTE(review): what these two indices select is not defined in this file —
# confirm against the code that consumes them.
load_idx: 0
env_idx: 0

# Training schedule.
# NOTE(review): the meaning and units of the counters below are only implied
# by their names — confirm against the training loop before changing them.
training:
  num_rounds: 50
  starting_episodes: 10
  num_episodes_per_round: 1
  horizon: 500
  num_updates: 40000
  save_interval: 10
  # String option; the set of accepted values is defined by the consuming code.
  init_index_type: spaced

# Buffer component. `_target_` follows Hydra's instantiate convention: a dotted
# import path, with the sibling keys passed as keyword arguments (presumably
# consumed via hydra.utils.instantiate — confirm at the call site).
buffer:
  _target_: buffer.DiscountedValueBuffer
  batch_size: 64

# Evaluation settings.
# NOTE(review): the unit of `interval` (rounds? updates?) is not stated in this
# file — confirm in the evaluation code.
eval:
  num_trajs: 16
  interval: 5

# Value-function component. `_target_` is the dotted path of the class to
# build; the remaining keys are its keyword arguments (presumably consumed via
# hydra.utils.instantiate — confirm at the call site).
value_function:
  _target_: control.value_functions.DiscreteValueNetwork
  hidden_dims: [256, 256]
  activation: "relu"
  # The literal string "none", not a YAML null.
  output_activation: "none"
  use_batch_norm: false
  ortho_init: false

# Optimizer component; `_target_` is the dotted path of the class to build and
# `lr` is passed to it as a keyword argument.
optimizer:
  _target_: torch.optim.Adam
  # Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` as a string rather than a float.
  lr: 1.0e-4

# Offline-learning settings.
# NOTE(review): semantics are only implied by the key names (sample count,
# algorithm identifier, model number) — confirm against the consuming code.
offline:
  num_samples: 1000000
  algo: iql
  model_nr: 0

# Single environment specification: one value per axis
# (robot / object / obstacle / objective).
env_config:
  robot: "IIWA"
  obj: "Dumbbell"
  # The string "None" (spelled as in data_env_configs), not a YAML null.
  obstacle: "None"
  objective: "PickPlace"

# Environment specifications for the data sources. The four lists have equal
# length; presumably entry i of each list forms one configuration — confirm
# against the code that reads them.
data_env_configs:
  # Placeholder: replace <TO SET> with the directory containing
  # composuite_logs/. The whole value is quoted so that no literal quote
  # characters end up inside the path.
  base_path: "<TO SET>/composuite_logs/"
  robot: ["IIWA", "IIWA"]
  obj: ["Hollowbox", "Dumbbell"]
  obstacle: ["None", "None"]
  objective: ["PickPlace", "Push"]

# wandb (Weights & Biases) settings.
wandb:
  project: "max-following-rl"
  # Placeholders — fill these in before running.
  entity: "<TO SET>"
  group: "<TO SET>"

# Hydra runtime settings: the per-run output directory, assembled from the
# exp_name and seed values defined in this file.
hydra:
  run:
    dir: "./_exp/${exp_name}/${seed}/"