# Dataset location and file identifiers.
# dataset_path is a placeholder value; point it at a real directory before use.
dataset_path: '/insert_directory_here/'
# Identifiers for the mocap data.
# NOTE(review): presumably resolved relative to dataset_path by the loader;
# confirm against the consuming code.
meta_id: mocap_meta
data_file: mocap_annotations
of_file: mocap_img_feats
# Counterparts of the three entries above for the "wild" (real_*) data.
meta_wild_id: real_mocap
data_wild_file: real_annotations
of_file_wild: real_img_feats

# General run settings.
# Name of the MuJoCo model.
# NOTE(review): presumably mapped to a model file by the consumer; confirm.
mujoco_model: 'humanoid_smpl_neutral_mesh'
# NOTE(review): presumably the random seed for the run; confirm.
seed: 2
# NOTE(review): fr_num is presumably a frame count; confirm its exact meaning.
fr_num: 100
augment: false

# Feature toggles. Each value is a plain boolean; what a flag switches on is
# decided by the consuming code, which is not part of this file.
# NOTE(review): use_of presumably pairs with the of_file / of_file_wild
# entries; confirm.
use_of: false
use_head: true
use_action: true
use_vel: false
use_context: false
smooth: true

# Model settings; model_v is the version tag for this group.
model_specs:
  model_v: 1
  # Layer sizes and types.
  # NOTE(review): rnn_hdim / cnn_fdim are presumably the RNN hidden size and
  # the CNN feature size; confirm.
  rnn_hdim: 1024
  cnn_fdim: 512
  # Three MLP hidden-layer widths, in order.
  mlp_hsize: [1024, 512, 256]
  mlp_htype: 'relu'
  rnn_type: 'gru'
  # w_* entries.
  # NOTE(review): presumably per-term loss weights; confirm which term each
  # suffix refers to.
  w_rp: 50.0
  w_rr: 50.0
  w_p: 1.0
  w_v: 1.0
  w_ee: 10.0
  w_op: 1.0
  w_or: 10.0

# Policy / value-network settings; policy_v is the version tag for this group.
policy_specs:
  policy_v: 1
  # log_std and fix_std are set together.
  # NOTE(review): presumably the log standard deviation is held constant when
  # fix_std is true; confirm.
  log_std: -3.2
  fix_std: true
  # NOTE(review): gamma / tau are presumably the discount factor and the
  # advantage-estimation coefficient; confirm.
  gamma: 0.95
  tau: 0.95

  # Policy network and its optimizer.
  policy_htype: relu
  policy_hsize: [512, 256]
  policy_optimizer: 'Adam'
  # Keep the dot in `1.e-5`: YAML 1.1 loaders such as PyYAML read `1e-5`
  # (no dot) as a string rather than a float.
  # policy_lr: 5.e-6
  policy_lr: 1.e-5
  policy_momentum: 0.0
  policy_weightdecay: 0.0

  # Value network and its optimizer (same layout as the policy entries).
  value_htype: relu
  value_hsize: [512, 256]
  value_optimizer: 'Adam'
  value_lr: 3.e-4
  value_momentum: 0.0
  value_weightdecay: 0.0

  clip_epsilon: 0.2
  # min_batch_size and mini_batch_size are two distinct keys that currently
  # hold the same value.
  # NOTE(review): confirm that both are read by the consumer.
  min_batch_size: 10000
  mini_batch_size: 10000
  reward_id: 'dynamic_supervision_v1'
  end_reward: false
  max_iter_num: 20000
  save_model_interval: 50

  # Update-mode switches and their iteration counts.
  rl_update: true
  init_update: false
  step_update: true
  full_update: false
  sampling_temp: 0.3
  sampling_freq: 0.5
  num_init_update: 3
  num_step_update: 20
  num_optim_epoch: 10

  reward_weights:
    # w_* entries: one weight per reward term; the six values sum to 1.0.
    w_hp: 0.15
    w_hq: 0.15
    w_p: 0.2
    w_jp: 0.2
    w_act_p: 0.2
    w_act_v: 0.1

    # k_* entries: one per w_* term above, matched by suffix.
    # NOTE(review): presumably scale coefficients inside each reward term;
    # confirm.
    k_hp: 45
    k_hq: 45
    k_p: 50
    k_jp: 50
    k_act_p: 5
    k_act_v: 0.005

# Top-level training settings (separate from model_specs / policy_specs).
# Keep the dot in `5.e-4`: YAML 1.1 loaders such as PyYAML read `5e-4`
# (no dot) as a string rather than a float.
lr: 5.e-4
weightdecay: 0.0
num_epoch: 10000
# NOTE(review): num_epoch_fix is presumably a count of initial epochs handled
# differently from the rest; confirm.
num_epoch_fix: 100
num_sample: 2000
batch_size: 256
iter_method: iter
shuffle: true
# A key with the same name and value also exists under policy_specs; the two
# are separate settings.
save_model_interval: 50
# NOTE(review): fr_margin is presumably a frame margin related to fr_num;
# confirm.
fr_margin: 5
has_z: true

# Noise settings.
# NOTE(review): noise_std is presumably the standard deviation of the noise
# applied when add_noise is true; confirm what the noise is added to.
add_noise: true
noise_std: 0.01

# Observation settings.
# NOTE(review): obs_coord presumably selects the coordinate frame used for
# observations; confirm the accepted values.
obs_coord: 'heading'
root_deheading: true
obs_global: true
# obs_max_out and obs_max_out_dist are set together.
# NOTE(review): presumably the distance is a threshold applied when
# obs_max_out is true; confirm.
obs_max_out: true
obs_max_out_dist: 0.5
obs_quat: true

