# Optimisation hyperparameters.
# NOTE(review): the descriptions below are inferred from the key names only;
# confirm each against the code that reads this file.
ac_gradient_clip: 100  # presumably a gradient-clipping bound for actor/critic
alpha: 0.2  # presumably the entropy/temperature coefficient — TODO confirm
batch_size: 128
# Actor and critic are given the same learning rate.
actor_lr: 0.0003
critic_lr: 0.0003
gamma: 0.99  # presumably the discount factor — TODO confirm
# Written with a decimal point, so YAML loaders return a float, not an int.
max_epochs_since_update_decay_interval: 150000.0

# Model / environment dimensions.
# NOTE(review): 17 and 3 do not look like the usual Gym Ant observation and
# action sizes; presumably placeholders overwritten at runtime — confirm.
state_dim: 17
action_dim: 3
# A single integer despite the plural key name.
hidden_sizes: 256
max_action: 1

# Boolean switch; presumably toggles temperature optimisation — TODO confirm
# against the code that reads this key.
# Spelled in canonical lowercase so loaders and linters agree it is a boolean.
temperature_opt: false

# Target-update and exploration settings.
# NOTE(review): meanings are inferred from the key names — confirm.
tau: 0.005  # presumably the soft target-update coefficient
update_interval: 2
expl_noise: 0.2  # presumably the exploration-noise scale

# Evaluation and run-length schedule.
# NOTE(review): units (environment steps vs. updates) are not stated in this
# file — confirm with the training loop.
eval_episode: 10
eval_freq: 10000
start_steps: 5000
max_step: 1000000
# presumably how often the target environment is interacted with — confirm
tar_env_interact_freq: 10

# Hard-coded device string; presumably needs overriding on machines without
# CUDA — confirm how the consumer handles this.
device: cuda

save_freq: 50000

# Same value as tar_env_config.env_name; src_env_config.env_name is "Ant-og".
env: Ant

# Source and target environment definitions. Only the target carries a
# `param` mapping.
src_env_config:
  env_name: Ant-og
tar_env_config:
  env_name: Ant
  # Keys below contain spaces (valid plain scalars); presumably matched
  # verbatim by the consumer, so do not rename them without checking.
  # Each value is a one-element list.
  # NOTE(review): every lower and upper entry is 0.01; whether these are
  # absolute limits or scale factors cannot be told from this file — confirm.
  param:
    fl hip lower limit:
    - 0.01
    fl hip upper limit:
    - 0.01
    fr hip lower limit:
    - 0.01
    fr hip upper limit:
    - 0.01

# Gating settings.
# NOTE(review): semantics are inferred from the key names — confirm.
likelihood_gate_threshold: 0.75
# Written with a decimal point, so YAML loaders return a float, not an int.
start_gate_src_sample: 100000.0
