# Run identification and logging.
# NOTE(review): "p2m" presumably abbreviates the point -> maze2d pairing set by
# source_morph/target_morph — confirm.
experiment_name: p2m
# Ends in the same "p2m" as experiment_name but is a separate literal, not an
# interpolation; update both together when renaming.
# NOTE(review): presumably the directory where results are written — confirm.
root_dir: cca/results/p2m
verbose: true

# Source/target pairing. The env ids and dataset paths below are derived from
# these three values through ${...} interpolation, so changing one of them here
# changes every dependent entry.
source_morph: point
target_morph: maze2d
maze_type: medium

# With the values above these resolve to point-medium-v1 and maze2d-medium-v1.
source_env_id: ${source_morph}-${maze_type}-v1
target_env_id: ${target_morph}-${maze_type}-v1
# Resolve to ./datasets/point/point-medium-v1.hdf5 and
# ./datasets/maze2d/maze2d-medium-v1.hdf5 (relative paths).
source_dataset: ./datasets/${source_morph}/${source_env_id}.hdf5
target_dataset: ./datasets/${target_morph}/${target_env_id}.hdf5
# Written with an explicit decimal point and exponent sign so YAML 1.1 loaders
# (e.g. PyYAML) also read a float; a bare `2e5` is loaded as a string there.
# Referenced by transfer.max_steps.
max_steps: 2.0e+5

# Integer ids assigned to the source and target domains.
# NOTE(review): domain_dim presumably is the size of the domain-id encoding
# (two ids, 0 and 1) — confirm against the consumer.
source_domain_id: 0
target_domain_id: 1
domain_dim: 2

# Reversal switches for source/target observations and actions; only
# reverse_source_observations is enabled in this configuration.
# NOTE(review): what "reverse" does to the data is defined by the consumer —
# confirm before changing.
# Booleans use canonical lowercase true/false, matching `verbose` above.
reverse_source_observations: true
reverse_source_actions: false
reverse_target_observations: false
reverse_target_actions: false
# NOTE(review): presumably restricts the reward to an auxiliary term — confirm.
aux_reward_only: true

# Coefficients: source_coef is zero and target_coef is one.
# NOTE(review): presumably weights on source/target terms of an objective, so
# the source term would contribute nothing here — confirm.
source_coef: 0.0
target_coef: 1.0
# transfer.alpha carries the same value as a separate literal (it is not an
# interpolation of this key).
alpha: 1.0

# List of task ids; currently a single entry.
# NOTE(review): presumably the tasks evaluated at inference time — confirm.
inference_task_ids: [7]

# Two-entry integer lists for `pi` and `qf`.
# NOTE(review): presumably hidden-layer widths of the policy (pi) and
# Q-function (qf) networks — confirm against the model constructor.
policy:
  pi: [300, 200]
  qf: [400, 300]

# Settings for the `bc` stage.
# NOTE(review): "bc" presumably stands for behavior cloning — confirm.
bc:
  num_epoch: 30
  log_interval: 10
  batch_size: 256
  # Explicit decimal point so YAML 1.1 loaders (e.g. PyYAML) read a float;
  # a bare `1e-3` is loaded as a string there.
  lr: 1.0e-3

# Settings for the `transfer` stage.
transfer:
  # Follows the top-level max_steps through interpolation.
  max_steps: ${max_steps}
  log_interval: 5
  # Explicit decimal point so YAML 1.1 loaders (e.g. PyYAML) read a float;
  # a bare `1e-3` is loaded as a string there.
  lr: 1.0e-3
  # Separate literal with the same value as the top-level `alpha`; it does not
  # track that key automatically.
  alpha: 1.0
  # NOTE(review): -1 presumably disables periodic evaluation — confirm.
  eval_freq: -1
  n_eval_episodes: 20

# Quoted because the value contains a colon; the parsed string is unchanged.
# NOTE(review): presumably a compute-device string selecting the first CUDA
# GPU — confirm with the consumer.
device: 'cuda:0'
