---
# Run identity and logging switches.
experiment_name: eval_p2a
logdir: null  # explicit YAML null; no log directory is set by this file
verbose: true
debug: false

# Morphology pair and maze layout. These three values are referenced through
# ${...} interpolation by source_env_id, target_env_id, source_dataset and
# target_dataset later in this file.
source_morph: point
target_morph: ant
maze_type: medium

# Output root plus one on/off switch per pipeline stage.
# NOTE(review): what each stage does is inferred from the key names only;
# confirm against the code that reads these flags.
root_dir: ./results/eval_p2a
train_alignment: true
evaluate_alignment: false
evaluate_by_inference_task: false
train_adaptation: true
evaluate_adaptation: true

# Environment ids and dataset paths, built from source_morph, target_morph and
# maze_type. Assuming the loader resolves ${...} interpolation, the values set
# in this file yield point-medium-v1 / ant-medium-v1 and
# ./datasets/point/point-medium-v1.hdf5 / ./datasets/ant/ant-medium-v1.hdf5.
# The templates are quoted so every YAML parser reads them as plain strings.
source_env_id: "${source_morph}-${maze_type}-v1"
target_env_id: "${target_morph}-${maze_type}-v1"
source_dataset: "./datasets/${source_morph}/${source_env_id}.hdf5"
target_dataset: "./datasets/${target_morph}/${target_env_id}.hdf5"

# Optimisation and data hyperparameters. Several of these are referenced
# elsewhere in this file through ${...} interpolation (lr, disc_lr, h,
# batch_size, adversarial_coef).
seed: null  # explicit YAML null; no seed value is fixed by this file
num_epoch: 40
log_interval: 10
batch_size: 512
# Written with an explicit mantissa dot. YAML 1.1 loaders such as PyYAML only
# recognise exponent notation as a float when the mantissa contains a ".";
# a bare 1e-4 is loaded as the string "1e-4" by those loaders.
lr: 1.0e-4
disc_lr: 1.0e-4
h: 512  # referenced as ${h} by policy.hid_dim and policy.latent_dim
betas:
  - 0.9
  - 0.999
max_dataset_size: 2000000
traj_len: 1
label_smoothing: 0.0
train_ratio: 0.9
source_coef: 1
target_coef: 1
adversarial_coef: 0.5  # referenced as ${adversarial_coef} by discriminator.coef
inference_task_ids:
  - 7
no_task_id: false

# Policy network settings. lr, hid_dim and latent_dim are taken from the
# top-level lr and h keys.
policy:
  lr: "${lr}"
  # NOTE(review): the -1 values look like placeholders that are filled in at
  # runtime; confirm against the code that builds the policy.
  state_dim: -1
  cond_dim: -1
  # NOTE(review): presumably matches the two domain ids (0 and 1) defined by
  # source_domain_id / target_domain_id in this file; confirm.
  domain_dim: 2
  out_dim: -1
  hid_dim: "${h}"
  latent_dim: "${h}"
  num_hidden_layers:
    - 4
    - 6
    - 4
  activation: mish
  latent_activation: tanh
  norm: "none"  # the literal string "none", not a YAML null
  use_domain_id: true
  spectral_norm: false
  encoder_decay: 0.0
  # Canonical lowercase boolean, matching every other flag in this file.
  decode_with_state: false

# Discriminator settings. coef and lr are taken from the top-level
# adversarial_coef and disc_lr keys.
discriminator:
  enable: true
  coef: "${adversarial_coef}"
  use_task_id: true
  lr: "${disc_lr}"
  alpha: false
  spectral_norm: false
  activation: relu

# Per-domain reversal switches; only source observations are enabled here.
# NOTE(review): what "reverse" does to the data is not visible in this file;
# confirm against the dataset-loading code.
reverse_source_observations: true
reverse_source_actions: false
reverse_target_observations: false
reverse_target_actions: false

# Integer ids assigned to the two domains.
source_domain_id: 0
target_domain_id: 1

# Quoted because the value contains a colon; it is a string either way.
device: "cuda:0"
# Evaluation settings, written as a block mapping (same keys and values as the
# earlier flow-style form).
# NOTE(review): units and exact meaning of each knob are defined by the
# evaluation code, which is not visible from this file.
evaluate_args:
  visualize_latents: true
  visualize_episodes: true
  evaluate: true
  processes: 1
  latents_size: 2000
  max_dataset_size: 100000
  batch_size: 5000
  num_eval_episodes: 100
  num_visualize_episodes: 4
  skip_frames: 5
  fps: 20
# Adaptation-stage settings. batch_size and lr are taken from the top-level
# keys of the same name.
adapt_args:
  max_dataset_size: 100000
  num_epoch: 50
  log_interval: 25
  batch_size: "${batch_size}"
  lr: "${lr}"
  betas: [0.9, 0.999]
  # YAML null. A bare `None` is not a null in YAML: it loads as the
  # four-character string "None".
  # NOTE(review): assumes "no model path" was intended; confirm with the code
  # that reads adapt_args.model_path.
  model_path: null
  # NOTE(review): this is a single literal key containing a dot, not a nested
  # policy -> lr mapping; confirm the consumer expects this spelling.
  policy.lr: "${lr}"
