# Hydra defaults list: entries are composed in order, later ones overriding
# earlier ones. `base` is loaded first and `_self_` (this file) last, so the
# values written below take precedence over anything `base` defines.
defaults:
  - base
  - _self_

# Policy node. `_target_` is the dotted path Hydra's instantiate() resolves;
# the remaining keys under `policy` are passed to it as keyword arguments.
policy:
  _target_: algos.MSP_DP.MeanFlowScalePolicy
  # Action VAE configuration, passed to the policy as `autoencoder`.
  autoencoder:
    _target_: algos.vae.vae.ActionVAE
    # Action dimensionality is taken from the task's shape metadata.
    action_dim: ${task.shape_meta.action.shape[0]}
    encoder_dim: 128
    decoder_dim: 128
    # Chunking parameters are shared with the rest of the config through
    # the `algo` node (not defined in this file).
    skill_block_size: ${algo.skill_block_size}
    downsample_factor: ${algo.downsample_factor}
    attn_pdrop: 0.1
    # Canonical lowercase booleans, matching the style used elsewhere in
    # this file.
    use_causal_encoder: true
    use_causal_decoder: true
    # NOTE(review): the decoder is configured with twice the heads and layers
    # of the encoder - presumably intentional; confirm.
    encoder_heads: 2
    encoder_layers: 2
    decoder_heads: 4
    decoder_layers: 4
    latent_dim: ${algo.latent_action_dim}
    # Written with an explicit mantissa dot: a bare `1e-6` is read as a
    # *string* by stock YAML 1.1 loaders (e.g. PyYAML); `1.0e-6` is a float
    # under every loader.
    kl_weight: 1.0e-6

  # FlowAR model configuration, passed to the policy as `flowar`.
  flowar:
    _target_: algos.flow.flow_ar.FlowAR
    # Encoder and decoder stacks are configured symmetrically.
    encoder_embed_dim: 256
    encoder_depth: 6
    encoder_num_heads: 4
    decoder_embed_dim: 256
    decoder_depth: 6
    decoder_num_heads: 4
    mlp_ratio: 4.0
    norm_layer:
      _target_: torch.nn.LayerNorm
      # Explicit mantissa dot so that stock YAML 1.1 loaders (e.g. PyYAML)
      # parse this as a float instead of the string "1e-6".
      eps: 1.0e-6
      # NOTE(review): hard-coded to the same value as the embed dims above;
      # presumably must be changed together with them - confirm.
      normalized_shape: 256
    # The flow model operates on latent actions, not raw actions.
    action_dim: ${algo.latent_action_dim}
    attn_dropout: 0.1
    proj_dropout: 0.1
    scale: [1, 2, 4, 8]
    # NOTE(review): hard-coded value; presumably the size of the observation
    # feature vector fed to FlowAR and therefore dependent on the image
    # encoder / task observation layout - verify when those change.
    obs_in_features: 3086

  # Image observation encoder, passed to the policy as `image_encoder`.
  image_encoder:
    _target_: algos.vision_image.obs_encoder.ImageObsEncoder
    shape_meta: ${task.shape_meta}

    # --- backbone ---------------------------------------------------------
    # Built by calling get_resnet(name=..., weights=...).
    rgb_model:
      _target_: diffusion_policy.model.vision.model_getter.get_resnet
      name: resnet18
      # null -> presumably no pretrained weights are loaded; confirm.
      weights: null
    share_rgb_model: false
    use_group_norm: true
    imagenet_norm: true

    # --- resizing / cropping ----------------------------------------------
    resize_shape: null
    crop_shape: 0.8
    random_crop: true
    transforms:
      - type: RandomResizedCrop
        scale: [0.75, 1.0]
        ratio: [0.75, 1.33]
        crop_prob: 1.0

    # --- colour augmentation ----------------------------------------------
    # Jitter is switched off; the parameters below are kept so it can be
    # enabled by flipping the flag alone.
    use_color_jitter: false
    color_jitter_params:
      brightness: 0.3
      contrast: 0.4
      saturation: 0.5
      hue: 0.08


  # Scalar keyword arguments for the policy itself. Every value is an
  # interpolation resolved from config nodes defined outside this file.

  # Training stage selector (top-level `stage` key).
  stage: ${stage}

  # Observation / execution horizons supplied by the task config.
  n_obs_steps: ${task.n_obs_steps}
  n_action_steps: ${task.n_action_steps}

  # Raw action space: per-step dimension and chunk length.
  action_dim: ${task.shape_meta.action.shape[0]}
  action_chunk: ${algo.skill_block_size}

  # Latent action space. The chunk length is skill_block_size divided by
  # downsample_factor via `//`; this relies on a custom `eval` resolver being
  # registered by the application (OmegaConf does not provide one).
  latent_action_dim: ${algo.latent_action_dim}
  latent_action_chunk: ${eval:'${algo.skill_block_size} // ${algo.downsample_factor}'}

# Identifier of this configuration.
# NOTE(review): presumably consumed by the base config or the training script
# (e.g. for run / output naming) - confirm where it is read.
name: MSP_Real



