# Core training hyperparameters.
# NOTE(review): the roles described below are inferred from the key names
# only; confirm them against the code that loads this file.
# alpha: presumably an entropy/regularisation coefficient - TODO confirm.
alpha: 0.2
batch_size: 128
# The two learning rates are set to the same value.
actor_lr: 0.0003
critic_lr: 0.0003
# gamma: presumably the discount factor - TODO confirm.
gamma: 0.99
# Written with a decimal point, so YAML loaders produce a float (150000.0)
# rather than an integer.
max_epochs_since_update_decay_interval: 150000.0

# Problem and network dimensions (all integers).
# NOTE(review): state_dim / action_dim presumably have to match the
# environment selected by `env`; verify against the consumer.
state_dim: 17
action_dim: 3
# A single integer despite the plural key name - confirm whether the consumer
# expects a scalar or a list here.
hidden_sizes: 256
max_action: 1

# Boolean flag, written in canonical lowercase so that every YAML schema
# (1.1, 1.2 core, 1.2 JSON) loads it as a boolean rather than a string.
# NOTE(review): presumably toggles optimisation of the temperature
# coefficient - confirm against the consumer.
temperature_opt: false

# Update-rule settings.
# NOTE(review): presumably the target-network mixing rate (tau), the update
# period (update_interval) and the exploration-noise scale (expl_noise);
# none of this is established by the file itself - confirm.
tau: 0.005
update_interval: 2
expl_noise: 0.2

# Evaluation and run-length counters (all integers).
# NOTE(review): the unit of each counter (environment steps, episodes,
# updates) is not stated in this file - confirm against the training loop.
eval_episode: 10
eval_freq: 10000
start_steps: 5000
max_step: 1000000
# presumably how often the target environment is interacted with - TODO confirm
tar_env_interact_freq: 10

# Plain string value.
# NOTE(review): presumably the compute device handed to the ML framework;
# confirm which other values the consumer accepts.
device: cuda

# Integer counter.
# NOTE(review): presumably the checkpoint-saving interval; unit not stated
# here - confirm.
save_freq: 50000

# Method-specific settings.
# NOTE(review): the meaning of lam, temp and proportion cannot be determined
# from this file - document them here once confirmed against the consumer.
lam: 0.7
temp: 3.0
proportion: 0.25
# String value; presumably names a similarity/distance measure - TODO confirm.
metric: 'cosine'

# Environment name (string). The same value also appears as
# tar_env_config.env_name in this file.
# NOTE(review): confirm whether the two are required to match.
env: Walker

# Nested settings for the environment named by env_name.
# NOTE(review): "tar" presumably stands for "target" - confirm.
tar_env_config:
  env_name: Walker
  param:
    # Keys contain spaces, hence the quotes; each value is a one-element list.
    # NOTE(review): both limits are set to the same value (0.01) - confirm
    # that this is intended.
    'right foot jnt lower limit': [0.01]
    'right foot jnt upper limit': [0.01]

