fabric:
  _target_: lightning.fabric.Fabric
  _convert_: all
  accelerator: gpu
  devices: ${ngpu}
  num_nodes: ${nodes}
  strategy:
    _target_: lightning.fabric.strategies.DDPStrategy
    find_unused_parameters: true
  precision: ${amp_precision}
  loggers:
  - _target_: lightning.fabric.loggers.TensorBoardLogger
    root_dir: ${save_dir}
ngpu: 1
nodes: 1
torch_deterministic: false
amp_precision: 32-true
force_flat_terrain: false
eval_overrides:
  ngpu: 1
  nodes: 1
  fabric:
    loggers: null
  headless: false
  num_envs: 1
  auto_load_latest: false
  vae_latent_from_prior: true
  vae_noise_type: zeros
  gt_actor_path: null
  algo:
    config:
      dagger:
        collect_data_with_expert: false
  env:
    config:
      max_episode_length: 10000
      enable_height_termination: false
      mimic_fixed_motion_per_env: false
      mimic_motion_sampling:
        init_start_prob: 1.0
        init_random_prob: 0
      mimic_reset_track:
        steps_min: 1000000
        steps_max: 1000001
      masked_mimic_masking:
        start_without_history_prob: 0
      mimic_early_termination: null
      mimic_dynamic_sampling:
        enabled: false
  masked_mimic_report_full_body_metrics: false
  scene_file: data/yaml_files/samp_scenes_test.yaml
algo:
  _target_: phys_anim.agents.mimic_vae_dagger.MimicVAEDagger
  _recursive_: false
  config:
    models:
      terrain_models:
        mlp:
          _target_: phys_anim.agents.models.common.Flatten
          config:
            normalize_obs: false
            obs_clamp_value: ${algo.config.obs_clamp_value}
          num_in: ${terrain.config.terrain_obs_num_samples}
          num_out: ${.num_in}
        transformer:
          _target_: phys_anim.agents.models.mlp.MLP_WithNorm
          config:
            initializer: ${algo.config.actor.config.initializer}
            units: ${oc.select:algo.config.models.transformer_obs_units,???}
            activation: ${algo.config.actor.config.activation}
            use_layer_norm: ${algo.config.actor.config.use_layer_norm}
            normalize_obs: ${algo.config.normalize_obs}
            obs_clamp_value: ${algo.config.obs_clamp_value}
            encoder_input_dim: ${terrain.config.terrain_obs_num_samples}
            operations:
            - type: encode
            - type: reshape
              new_shape:
              - batch_size
              - 1
              - ${algo.config.models.terrain_models.transformer.num_out}
          num_in: ${terrain.config.terrain_obs_num_samples}
          num_out: ${oc.select:algo.config.actor.config.mu_model.config.transformer_token_size,???}
      encoder_preprocessor_units:
      - 1024
      - 1024
      - 1024
      encoder_preprocessor_output_dim: 1024
      prior_preprocessor_output_dim: ${algo.config.models.prior_pre_processor.config.latent_dim}
      prior_preprocessor_units:
      - 256
      - 256
      prior_output_units:
      - 256
      - 128
      encoder_output_units:
      - 512
      encoder_pre_processor:
        _target_: phys_anim.agents.models.mlp.MultiHeadedMLP
        _recursive_: false
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.encoder_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          extra_inputs:
            terrain: ${algo.config.models.terrain_models.mlp}
            mimic_target_poses: ${algo.config.models.mimic_target_pose_model}
            masked_mimic_target_bodies_masks: ${algo.config.models.masked_mimic_target_bodies_mask_model}
        num_out: ${algo.config.models.encoder_preprocessor_output_dim}
      vae_encoder_model:
        _target_: phys_anim.agents.models.mlp.MultiOutputNetwork
        _recursive_: false
        config:
          normalize_obs: false
          obs_clamp_value: null
          trunk: ${algo.config.models.encoder_pre_processor}
          outputs:
            mu:
              _target_: phys_anim.agents.models.mlp.MLP_WithNorm
              config:
                initializer: ${algo.config.actor.config.initializer}
                units: ${algo.config.models.encoder_output_units}
                activation: ${algo.config.actor.config.activation}
                normalize_obs: false
                obs_clamp_value: null
                use_layer_norm: ${algo.config.actor.config.use_layer_norm}
              num_in: ${algo.config.models.encoder_preprocessor_output_dim}
              num_out: ${algo.config.actor.config.vae_latent_dim}
            logvar:
              _target_: phys_anim.agents.models.mlp.MLP_WithNorm
              config:
                activation: ${algo.config.actor.config.activation}
                use_layer_norm: ${algo.config.actor.config.use_layer_norm}
                initializer: ${algo.config.actor.config.initializer}
                units: ${algo.config.models.encoder_output_units}
                normalize_obs: false
                obs_clamp_value: null
              num_in: ${algo.config.models.encoder_preprocessor_output_dim}
              num_out: ${algo.config.actor.config.vae_latent_dim}
        num_out: ${algo.config.actor.config.vae_latent_dim}
      prior_pre_processor:
        _target_: phys_anim.agents.models.transformer.TransformerWithNorm
        _recursive_: false
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          terrain_model: ${algo.config.models.terrain_models.transformer}
          extra_inputs:
            terrain: ${..terrain_model}
            masked_mimic_target_poses: ${algo.config.models.masked_mimic_target_pose_model}
            masked_mimic_target_poses_masks: ${algo.config.models.masked_mimic_target_poses_mask_model}
            motion_text_embeddings: ${algo.config.models.motion_text_embeddings_for_transformer_model}
            motion_text_embeddings_mask: ${algo.config.models.motion_text_embeddings_mask_model}
            historical_pose_obs: ${algo.config.models.historical_poses_for_transformer_model}
            historical_pose_obs_mask: ${algo.config.models.historical_poses_mask_model}
            object_bounding_box_obs: ${algo.config.models.object_bounding_box_for_transformer_model}
            object_bounding_box_obs_mask: ${algo.config.models.object_bounding_box_mask_model}
          latent_dim: 512
          ff_size: 1024
          type_embedding_dim: 0
          num_layers: 4
          num_heads: 4
          dropout: 0
          num_obs_per_target_pose: ${env.config.masked_mimic_obs.num_obs_per_sparse_target_pose}
          num_future_steps: ${env.config.mimic_target_pose.num_future_steps}
          output_decoder: false
          obs_mlp:
            initializer: ${algo.config.actor.config.initializer}
            units: ${algo.config.models.prior_preprocessor_units}
            activation: ${algo.config.actor.config.activation}
            use_layer_norm: ${algo.config.actor.config.use_layer_norm}
            normalize_obs: ${algo.config.normalize_obs}
            obs_clamp_value: ${algo.config.obs_clamp_value}
          output_mlp:
            initializer: ${algo.config.actor.config.initializer}
            units:
            - 1
            activation: ${algo.config.actor.config.activation}
            use_layer_norm: ${algo.config.actor.config.use_layer_norm}
            normalize_obs: false
            obs_clamp_value: null
            num_out: ${algo.config.actor.config.vae_latent_dim}
        num_out: ${algo.config.models.prior_pre_processor.config.latent_dim}
      vae_prior_model:
        _target_: phys_anim.agents.models.mlp.MultiOutputNetwork
        _recursive_: false
        config:
          normalize_obs: false
          obs_clamp_value: null
          trunk: ${algo.config.models.prior_pre_processor}
          outputs:
            mu:
              _target_: phys_anim.agents.models.mlp.MLP_WithNorm
              config:
                initializer: ${algo.config.actor.config.initializer}
                units: ${algo.config.models.prior_output_units}
                activation: ${algo.config.actor.config.activation}
                normalize_obs: false
                obs_clamp_value: null
                use_layer_norm: ${algo.config.actor.config.use_layer_norm}
              num_in: ${algo.config.models.prior_pre_processor.num_out}
              num_out: ${algo.config.actor.config.vae_latent_dim}
            logvar:
              _target_: phys_anim.agents.models.mlp.MLP_WithNorm
              config:
                initializer: ${algo.config.actor.config.initializer}
                units: ${algo.config.models.prior_output_units}
                activation: ${algo.config.actor.config.activation}
                use_layer_norm: ${algo.config.actor.config.use_layer_norm}
                normalize_obs: false
                obs_clamp_value: null
              num_in: ${algo.config.models.prior_pre_processor.num_out}
              num_out: ${algo.config.actor.config.vae_latent_dim}
        num_out: ${algo.config.actor.config.vae_latent_dim}
      vae_latent_model:
        _target_: phys_anim.agents.models.mlp.MLP_WithNorm
        config:
          activation: ${algo.config.actor.config.activation}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_output_units}
          normalize_obs: false
          obs_clamp_value: null
        num_in: ${algo.config.actor.config.vae_latent_dim}
        num_out: ${algo.config.actor.config.vae_latent_dim}
      transformer_obs_units: ${.prior_preprocessor_units}
      mimic_target_pose_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
        num_in: ${eval:${env.config.mimic_target_pose.num_future_steps}*${env.config.mimic_target_pose.num_obs_per_target_pose}}
        num_out: ${.num_in}
      masked_mimic_target_bodies_mask_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: false
          obs_clamp_value: null
          dtype: bool
        num_in: ${eval:${eval:${len:${env.config.masked_mimic_conditionable_bodies}}+1}*2*${env.config.mimic_target_pose.num_future_steps}}
        num_out: ${.num_in}
      masked_mimic_target_poses_mask_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: false
          obs_clamp_value: null
          dtype: bool
        num_in: ${env.config.masked_mimic_obs.masked_mimic_target_poses_num_steps}
        num_out: ${.num_in}
      masked_mimic_target_pose_model:
        _target_: phys_anim.agents.models.mlp.MLP_WithNorm
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          encoder_input_dim: ${env.config.masked_mimic_obs.num_obs_per_sparse_target_pose}
          mask_key: masked_mimic_target_poses_masks
          mask_valid_as_zeros: false
          obs_per_body_controller: 12
          operations:
          - type: reshape
            new_shape:
            - -1
            - ${env.config.masked_mimic_obs.num_obs_per_sparse_target_pose}
          - type: encode
          - type: reshape
            new_shape:
            - batch_size
            - ${env.config.masked_mimic_obs.masked_mimic_target_poses_num_steps}
            - ${algo.config.models.masked_mimic_target_pose_model.num_out}
        num_in: ${eval:${env.config.masked_mimic_obs.masked_mimic_target_poses_num_steps}*${env.config.masked_mimic_obs.num_obs_per_sparse_target_pose}}
        num_out: ${algo.config.actor.config.mu_model.config.transformer_token_size}
      motion_text_embeddings_mask_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: false
          obs_clamp_value: null
          dtype: bool
        num_in: 1
        num_out: 1
      motion_text_embeddings_for_transformer_model:
        _target_: phys_anim.agents.models.mlp.MLP_WithNorm
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          encoder_input_dim: ${env.config.masked_mimic_obs.text_embedding_dim}
          mask_key: motion_text_embeddings_mask
          mask_valid_as_zeros: false
          operations:
          - type: encode
          - type: reshape
            new_shape:
            - batch_size
            - 1
            - ${algo.config.models.motion_text_embeddings_for_transformer_model.num_out}
        num_in: ${env.config.masked_mimic_obs.text_embedding_dim}
        num_out: ${algo.config.actor.config.mu_model.config.transformer_token_size}
      historical_poses_mask_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: false
          obs_clamp_value: null
          dtype: bool
        num_in: ${env.config.masked_mimic_obs.num_historical_conditioned_steps}
        num_out: ${.num_in}
      historical_poses_for_transformer_model:
        _target_: phys_anim.agents.models.mlp.MLP_WithNorm
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          encoder_input_dim: ${env.config.masked_mimic_obs.historical_obs_size_per_pose}
          mask_key: historical_pose_obs_mask
          mask_valid_as_zeros: false
          operations:
          - type: reshape
            new_shape:
            - -1
            - ${env.config.masked_mimic_obs.historical_obs_size_per_pose}
          - type: encode
          - type: reshape
            new_shape:
            - batch_size
            - ${env.config.masked_mimic_obs.num_historical_conditioned_steps}
            - ${algo.config.models.historical_poses_for_transformer_model.num_out}
        num_in: ${eval:${env.config.masked_mimic_obs.num_historical_conditioned_steps}*${env.config.masked_mimic_obs.historical_obs_size_per_pose}}
        num_out: ${algo.config.actor.config.mu_model.config.transformer_token_size}
      object_bounding_box_mask_model:
        _target_: phys_anim.agents.models.common.Flatten
        config:
          normalize_obs: false
          obs_clamp_value: null
          dtype: bool
        num_in: 1
        num_out: 1
      object_bounding_box_for_transformer_model:
        _target_: phys_anim.agents.models.mlp.MLP_WithNorm
        config:
          initializer: ${algo.config.actor.config.initializer}
          units: ${algo.config.models.prior_preprocessor_units}
          activation: ${algo.config.actor.config.activation}
          use_layer_norm: ${algo.config.actor.config.use_layer_norm}
          normalize_obs: ${algo.config.normalize_obs}
          obs_clamp_value: ${algo.config.obs_clamp_value}
          encoder_input_dim: ${env.config.masked_mimic_obs.object_bounding_box_obs_dim}
          mask_key: object_bounding_box_obs_mask
          mask_valid_as_zeros: false
          operations:
          - type: encode
          - type: reshape
            new_shape:
            - batch_size
            - 1
            - ${algo.config.models.object_bounding_box_for_transformer_model.num_out}
        num_in: ${env.config.masked_mimic_obs.object_bounding_box_obs_dim}
        num_out: ${algo.config.actor.config.mu_model.config.transformer_token_size}
    actor:
      _target_: phys_anim.agents.models.actor.ActorFixedSigmaVAE
      _recursive_: false
      config:
        mu_model:
          _target_: phys_anim.agents.models.mlp.MultiHeadedMLP
          _recursive_: false
          config:
            initializer: ${algo.config.actor.config.initializer}
            units:
            - 1024
            - 1024
            - 1024
            activation: ${algo.config.actor.config.activation}
            normalize_obs: ${algo.config.normalize_obs}
            obs_clamp_value: ${algo.config.obs_clamp_value}
            use_layer_norm: ${algo.config.actor.config.use_layer_norm}
            terrain_model: ${algo.config.models.terrain_models.mlp}
            extra_inputs:
              terrain: ${..terrain_model}
              vae_latent: ${algo.config.models.vae_latent_model}
            transformer_token_size: ${algo.config.models.prior_pre_processor.config.latent_dim}
        init_logstd: -2.9
        learnable_sigma: false
        sigma_schedule: null
        use_layer_norm: false
        activation: relu
        initializer: default
        vae_encoder: ${algo.config.models.vae_encoder_model}
        vae_prior: ${algo.config.models.vae_prior_model}
        vae_latent_from_prior: ${vae_latent_from_prior}
        vae_latent_dim: 64
        residual_encoder: true
    critic:
      _target_: phys_anim.agents.models.critic.CriticMLP
      _recursive_: false
      config:
        initializer: default
        units:
        - 1
        activation: relu
        normalize_obs: ${algo.config.normalize_obs}
        obs_clamp_value: ${algo.config.obs_clamp_value}
        use_layer_norm: false
        extra_inputs:
          terrain: ${algo.config.models.terrain_models.mlp}
          mimic_target_poses: ${algo.config.models.mimic_target_pose_model}
          masked_mimic_target_bodies_masks: ${algo.config.models.masked_mimic_target_bodies_mask_model}
    actor_optimizer:
      _target_: torch.optim.Adam
      lr: 2.0e-05
      betas:
      - 0.9
      - 0.999
    critic_optimizer:
      _target_: torch.optim.Adam
      lr: 0.0001
      betas:
      - 0.9
      - 0.999
    actor_lr_scheduler: null
    critic_lr_scheduler: null
    schedules: null
    num_steps: 32
    tau: 0.95
    gamma: 0.99
    e_clip: 0.2
    clip_critic_loss: true
    gradient_clip_val: 50.0
    fail_on_bad_grads: false
    check_grad_mag: true
    bounds_loss_coef: 10
    normalize_values: true
    val_clamp_value: null
    normalize_advantage: true
    normalize_obs: true
    batch_size: 16384
    task_reward_w: 1.0
    num_mini_epochs: 6
    gradient_accumulation_steps: 1
    max_eval_steps: null
    eval_metrics_every: 500
    eval_metric_keys:
    - cartesian_err
    - gt_err
    - dv_rew
    - kb_rew
    - lr_rew
    - rv_rew
    - rav_rew
    - gr_err
    - gr_err_degrees
    training_early_termination:
      early_terminate_cart_err: null
      early_terminate_reward_too_bad_prob: null
    num_games: null
    manual_save_every: 10
    use_rand_action_masks: false
    obs_clamp_value: null
    max_epochs: ${eval:${training_max_steps}//${ngpu}//${num_envs}//${.num_steps}}
    eval_callbacks: null
    extra_inputs:
      vae_latent:
        retrieve_from_env: false
        dtype: float
        size: ${algo.config.actor.config.vae_latent_dim}
      terrain:
        retrieve_from_env: true
        dtype: float
        size: ${terrain.config.terrain_obs_num_samples}
        env_obs_name: terrain_obs
      mimic_target_poses:
        retrieve_from_env: true
        dtype: float
        size: ${algo.config.models.mimic_target_pose_model.num_in}
      masked_mimic_target_poses:
        retrieve_from_env: true
        dtype: float
        size: ${algo.config.models.masked_mimic_target_pose_model.num_in}
      masked_mimic_target_poses_masks:
        retrieve_from_env: true
        dtype: bool
        size: ${algo.config.models.masked_mimic_target_poses_mask_model.num_in}
      masked_mimic_target_bodies_masks:
        retrieve_from_env: true
        dtype: bool
        size: ${algo.config.models.masked_mimic_target_bodies_mask_model.num_in}
      motion_text_embeddings:
        retrieve_from_env: true
        dtype: float
        size: ${env.config.masked_mimic_obs.text_embedding_dim}
      motion_text_embeddings_mask:
        retrieve_from_env: true
        dtype: bool
        size: 1
      historical_pose_obs:
        retrieve_from_env: true
        dtype: float
        size: ${eval:${env.config.masked_mimic_obs.historical_obs_size_per_pose}*${env.config.masked_mimic_obs.num_historical_conditioned_steps}}
      historical_pose_obs_mask:
        retrieve_from_env: true
        dtype: bool
        size: ${env.config.masked_mimic_obs.num_historical_conditioned_steps}
      object_bounding_box_obs:
        retrieve_from_env: true
        dtype: float
        size: ${env.config.masked_mimic_obs.object_bounding_box_obs_dim}
      object_bounding_box_obs_mask:
        retrieve_from_env: true
        dtype: bool
        size: 1
    discriminator:
      _target_: phys_anim.agents.models.discriminator.JointDiscMLP
      _recursive_: false
      config:
        initializer: default
        units:
        - 1
        discriminator_obs_historical_steps: ${env.config.discriminator_obs_historical_steps}
        activation: relu
        normalize_obs: ${algo.config.normalize_obs}
        obs_clamp_value: ${algo.config.obs_clamp_value}
        use_layer_norm: false
        extra_inputs: null
    discriminator_optimizer:
      _target_: torch.optim.Adam
      _recursive_: false
      lr: 0
      betas:
      - 0.9
      - 0.999
    discriminator_lr_scheduler: null
    discriminator_weight_decay: 0.0001
    discriminator_logit_weight_decay: 0.01
    discriminator_batch_size: 4096
    discriminator_reward_w: 2.0
    discriminator_grad_penalty: 5
    discriminator_replay_keep_prob: 0.01
    discriminator_replay_size: 200000
    num_discriminator_mini_epochs: 3
    eval_length: null
    eval_num_episodes: 1
    vae:
      vae_kld_schedule:
        init_kld_coeff: 0.0001
        end_kld_coeff: 0.01
        start_epoch: 3000
        end_epoch: 6000
      vae_noise_type: ${vae_noise_type}
    dagger:
      bc_coeff: 1.0
      gt_actor_path: ${gt_actor_path}
      only_bc: true
      collect_data_with_expert: false
env:
  _target_: phys_anim.envs.masked_mimic.${backbone}.MaskedMimicHumanoid
  _recursive_: false
  config:
    experiment_name: ${experiment_name}
    num_envs: ${num_envs}
    headless: ${headless}
    backbone: ${backbone}
    max_episode_length: 1000
    robot: ${robot}
    humanoid_obs:
      use_max_coords_obs: true
      local_root_obs: true
      root_height_obs: true
    termination_height: 0.15
    head_termination_height: 0.3
    shield_termination_height: 0.32
    enable_height_termination: false
    motion_lib: ${motion_lib}
    motion_index_offset: null
    fixed_motion_id: null
    hybrid_init_prob: 0.0
    state_init: Random
    ref_respawn_offset: ${ref_respawn_offset}
    simulator:
      plane:
        static_friction: 1.0
        dynamic_friction: 1.0
        restitution: 0.0
      sim:
        fps: 60
        control_freq_inv: 2
        substeps: 2
        physx:
          num_threads: 4
          solver_type: 1
          num_position_iterations: 4
          num_velocity_iterations: 0
          contact_offset: 0.02
          rest_offset: 0.0
          bounce_threshold_velocity: 0.2
          max_depenetration_velocity: 10.0
          default_buffer_size_multiplier: 10.0
        flex:
          num_inner_iterations: 10
          warm_start: 0.25
    terrain: ${terrain}
    force_flat_terrain: ${force_flat_terrain}
    scene_lib: ${scene_lib}
    object_types:
    - Armchairs
    - StraightChairs
    - HighStools
    - LowStools
    - Sofas
    - Tables
    - LargeSofas
    object_ref_respawn_offset: 0.1
    visualize_markers: true
    sync_motion: false
    output_motion: false
    camera: null
    export_video: false
    export_motion: false
    record_viewer: false
    viewer_record_dir: output/recordings/viewer
    discriminator_obs_historical_steps: 1
    disable_discriminator: true
    discriminator_obs_size_per_step: ${eval:13+${robot.dof_obs_size}+${robot.number_of_actions}+3*${robot.num_key_bodies}}
    mimic_residual_control: false
    mimic_conditionable_bodies: null
    mimic_fixed_motion_per_env: false
    mimic_motion_sampling:
      init_start_prob: 0.15
      init_random_prob: 0.05
    mimic_early_termination:
    - mimic_early_termination_key: max_joint_err
      mimic_early_termination_thresh: 0.5
      mimic_early_termination_thresh_on_flat: 0.25
      from_other: true
      less_than: false
    mimic_reward_config:
      positive_constant: 0
      tan_norm_reward: false
      relative_kb_pos: false
      unequal_reward_joint_weights: false
      add_rr_to_lr: true
      rt_ignore_height: true
      sum_before_exp: true
      component_weights:
        gr_rew_w: 0.3
        lr_rew_w: 0
        gt_rew_w: 0.5
        rt_rew_w: 0
        rv_rew_w: 0
        rav_rew_w: 0
        gv_rew_w: 0.1
        gav_rew_w: 0.1
        kb_rew_w: 0
        dv_rew_w: 0.0
        rh_rew_w: 0.2
        kbf_rew_w: 0.0
        pow_rew_w: 0.0005
      component_coefficients:
        gt_rew_c: -100
        rt_rew_c: -120
        rv_rew_c: -1
        rav_rew_c: -0.3
        gv_rew_c: -0.5
        gav_rew_c: -0.1
        kb_rew_c: -100
        gr_rew_c: -2
        lr_rew_c: -2
        dv_rew_c: -0.005
        rh_rew_c: -100
        kbf_rew_c: -0.01
    mimic_dynamic_sampling:
      enabled: true
      sampling_criteria: mimic_early_termination
      bucket_width: 2.0
      min_bucket_weight: 1.0e-06
      dynamic_weight_pow: 1.0
      dynamic_weight_max: null
      update_dynamic_weight_epochs: 5
    mimic_reset_track:
      steps_min: 10
      steps_max: 600
      grace_period: 5
      reset_on_episode_reset: false
      reset_episode_on_reset_track: true
    mimic_target_pose:
      enabled: true
      type: max-coords-future-rel
      with_time: false
      num_future_steps: 10
      num_obs_per_target_pose: ${.base_num_obs_per_target_pose}
      base_num_obs_per_target_pose: ${eval:${.num_obs_per_joint}*${robot.num_bodies}}
      num_obs_per_joint: 18
      target_pose_type: max-coords
    masked_mimic_masking:
      joint_masking:
        masked_mimic_time_mask: true
        masked_mimic_time_gap_probability: 0.1
        time_gap_mask_min_steps: 1
        time_gap_mask_max_steps: ${eval:${env.config.mimic_target_pose.num_future_steps}+1}
        with_conditioning_time_gap_mask_max_steps: ${eval:${.time_gap_mask_max_steps}*4}
        with_conditioning_max_gap_probability: 0.2
        masked_mimic_repeat_mask_probability: 0.98
        masked_mimic_fixed_conditioning: null
        force_max_conditioned_bodies_prob: 0.1
        force_small_num_conditioned_bodies_prob: 0.1
      target_pose_visible_prob: 0
      target_pose_joint_probs: 0
      motion_text_embeddings_visible_prob: 0.5
      object_bounding_box_visible_prob: 0.8
      start_without_history_prob: 0
    masked_mimic_obs:
      num_obs_per_sparse_target_pose: ${eval:${.num_obs_per_target_pose}*${eval:${len:${..masked_mimic_conditionable_bodies}}+1}//${robot.num_bodies}+${eval:${len:${..masked_mimic_conditionable_bodies}}+1}*2+2}
      num_future_steps: 10
      num_obs_per_joint: 24
      num_obs_per_target_pose: ${eval:${.num_obs_per_joint}*${robot.num_bodies}}
      text_embedding_dim: 512
      num_historical_stored_steps: 120
      num_historical_conditioned_steps: 15
      historical_obs_size_per_pose: ${eval:${robot.num_bodies}*9+1}
      masked_mimic_report_full_body_metrics: ${masked_mimic_report_full_body_metrics}
      masked_mimic_target_poses_num_steps: ${eval:${env.config.mimic_target_pose.num_future_steps}+1}
      object_bounding_box_obs_dim: 37
    masked_mimic_conditionable_bodies:
    - L_Ankle
    - R_Ankle
    - Pelvis
    - Head
    - L_Hand
    - R_Hand
robot:
  dof_obs_size: 138
  number_of_actions: 69
  self_obs_size: ${.self_obs_max_coords_size}}
  self_obs_max_coords_size: 358
  num_bodies: ${len:${.bfs_body_names}}
  contact_bodies: ${.bfs_body_names}
  bfs_body_names:
  - Pelvis
  - L_Hip
  - R_Hip
  - Torso
  - L_Knee
  - R_Knee
  - Spine
  - L_Ankle
  - R_Ankle
  - Chest
  - L_Toe
  - R_Toe
  - Neck
  - L_Thorax
  - R_Thorax
  - Head
  - L_Shoulder
  - R_Shoulder
  - L_Elbow
  - R_Elbow
  - L_Wrist
  - R_Wrist
  - L_Hand
  - R_Hand
  dfs_body_names:
  - Pelvis
  - L_Hip
  - L_Knee
  - L_Ankle
  - L_Toe
  - R_Hip
  - R_Knee
  - R_Ankle
  - R_Toe
  - Torso
  - Spine
  - Chest
  - Neck
  - Head
  - L_Thorax
  - L_Shoulder
  - L_Elbow
  - L_Wrist
  - L_Hand
  - R_Thorax
  - R_Shoulder
  - R_Elbow
  - R_Wrist
  - R_Hand
  dfs_dof_names:
  - L_Hip_x
  - L_Hip_y
  - L_Hip_z
  - L_Knee_x
  - L_Knee_y
  - L_Knee_z
  - L_Ankle_x
  - L_Ankle_y
  - L_Ankle_z
  - L_Toe_x
  - L_Toe_y
  - L_Toe_z
  - R_Hip_x
  - R_Hip_y
  - R_Hip_z
  - R_Knee_x
  - R_Knee_y
  - R_Knee_z
  - R_Ankle_x
  - R_Ankle_y
  - R_Ankle_z
  - R_Toe_x
  - R_Toe_y
  - R_Toe_z
  - Torso_x
  - Torso_y
  - Torso_z
  - Spine_x
  - Spine_y
  - Spine_z
  - Chest_x
  - Chest_y
  - Chest_z
  - Neck_x
  - Neck_y
  - Neck_z
  - Head_x
  - Head_y
  - Head_z
  - L_Thorax_x
  - L_Thorax_y
  - L_Thorax_z
  - L_Shoulder_x
  - L_Shoulder_y
  - L_Shoulder_z
  - L_Elbow_x
  - L_Elbow_y
  - L_Elbow_z
  - L_Wrist_x
  - L_Wrist_y
  - L_Wrist_z
  - L_Hand_x
  - L_Hand_y
  - L_Hand_z
  - R_Thorax_x
  - R_Thorax_y
  - R_Thorax_z
  - R_Shoulder_x
  - R_Shoulder_y
  - R_Shoulder_z
  - R_Elbow_x
  - R_Elbow_y
  - R_Elbow_z
  - R_Wrist_x
  - R_Wrist_y
  - R_Wrist_z
  - R_Hand_x
  - R_Hand_y
  - R_Hand_z
  bfs_dof_names:
  - L_Hip_x
  - L_Hip_y
  - L_Hip_z
  - R_Hip_x
  - R_Hip_y
  - R_Hip_z
  - Torso_x
  - Torso_y
  - Torso_z
  - L_Knee_x
  - L_Knee_y
  - L_Knee_z
  - R_Knee_x
  - R_Knee_y
  - R_Knee_z
  - Spine_x
  - Spine_y
  - Spine_z
  - L_Ankle_x
  - L_Ankle_y
  - L_Ankle_z
  - R_Ankle_x
  - R_Ankle_y
  - R_Ankle_z
  - Chest_x
  - Chest_y
  - Chest_z
  - L_Toe_x
  - L_Toe_y
  - L_Toe_z
  - R_Toe_x
  - R_Toe_y
  - R_Toe_z
  - Neck_x
  - Neck_y
  - Neck_z
  - L_Thorax_x
  - L_Thorax_y
  - L_Thorax_z
  - R_Thorax_x
  - R_Thorax_y
  - R_Thorax_z
  - Head_x
  - Head_y
  - Head_z
  - L_Shoulder_x
  - L_Shoulder_y
  - L_Shoulder_z
  - R_Shoulder_x
  - R_Shoulder_y
  - R_Shoulder_z
  - L_Elbow_x
  - L_Elbow_y
  - L_Elbow_z
  - R_Elbow_x
  - R_Elbow_y
  - R_Elbow_z
  - L_Wrist_x
  - L_Wrist_y
  - L_Wrist_z
  - R_Wrist_x
  - R_Wrist_y
  - R_Wrist_z
  - L_Hand_x
  - L_Hand_y
  - L_Hand_z
  - R_Hand_x
  - R_Hand_y
  - R_Hand_z
  dof_body_ids: ???
  key_bodies:
  - R_Ankle
  - L_Ankle
  - L_Hand
  - R_Hand
  non_termination_contact_bodies:
  - R_Ankle
  - L_Ankle
  - R_Toe
  - L_Toe
  foot_name: null
  init_state: null
  contact_pairs_multiplier: 16
  num_key_bodies: ${len:${robot.key_bodies}}
  mimic_small_marker_bodies: null
  control:
    control_type: isaac_pd
    stiffness: null
    damping: null
    action_scale: 1.0
    isaac_pd_scale: false
    clamp_actions: 1.0
  asset:
    collapse_fixed_joints: null
    replace_cylinder_with_capsule: null
    flip_visual_attachments: null
    armature: null
    thickness: null
    max_angular_velocity: null
    max_linear_velocity: null
    density: null
    angular_damping: null
    linear_damping: null
    disable_gravity: null
    fix_base_link: null
    default_dof_drive_mode: 1
    robot_type: smpl_humanoid
    asset_file_name: mjcf/${robot.asset.robot_type}.xml
    asset_root: phys_anim/data/assets
    self_collisions: true
    filter_ints:
    - 0
    - 0
    - 7
    - 16
    - 12
    - 0
    - 56
    - 2
    - 33
    - 128
    - 0
    - 192
    - 0
    - 64
    - 0
    - 0
    - 0
    - 0
    - 0
    - 0
    - 0
    - 0
    - 0
    - 0
  dfs_dof_body_ids:
  - 1
  - 2
  - 3
  - 4
  - 5
  - 6
  - 7
  - 8
  - 9
  - 10
  - 11
  - 12
  - 13
  - 14
  - 15
  - 16
  - 17
  - 18
  - 19
  - 20
  - 21
  - 22
  - 23
  right_foot_name: R_Ankle
  left_foot_name: L_Ankle
motion_lib:
  _target_: phys_anim.utils.motion_lib.MotionLib
  motion_file: ${motion_file}
  ref_height_adjust: 0.0
  fix_motion_heights: true
motion_file: ???
scene_lib:
  max_num_objects: null
  scene_yaml_path: ${scene_file}
  num_object_types: 7
  force_single_robot_per_scene: false
  scene_replications: 1
  max_objects_per_scene: 1
scene_file: data/yaml_files/samp_scenes_train.yaml
terrain:
  _target_: phys_anim.envs.env_utils.terrains.terrain.Terrain
  config:
    terrain_composition: curriculum
    map_length: 20.0
    map_width: 20.0
    border_size: 40.0
    num_levels: 10
    num_terrains: 10
    terrain_proportions:
    - 0.2
    - 0.1
    - 0.1
    - 0.1
    - 0.05
    - 0.0
    - 0.0
    - 0.45
    slope_threshold: 0.9
    num_samples_per_axis: 16
    sample_width: 1
    terrain_obs_num_samples: ${eval:${.num_samples_per_axis}**2}
    horizontal_scale: 0.1
    vertical_scale: 0.005
    spacing_between_scenes: 5
    minimal_humanoid_spacing: 0
    terrain_path: null
    load_terrain: false
    save_terrain: false
seed: 0
training_max_steps: 10000000000
codebase_version: 1.0
headless: true
num_envs: 4096
auto_load_latest: false
checkpoint: null
experiment_name: masked_mimic
base_dir: results
save_dir: ${base_dir}/${experiment_name}
vae_latent_from_prior: false
vae_noise_type: normal
gt_actor_path: ???
ref_respawn_offset: 0.25
masked_mimic_report_full_body_metrics: true
backbone: isaacgym
