# UNet model configuration.
# `type` and `architecture` name the model this file configures.
# NOTE(review): presumably the loading code uses these two values to pick the
# implementation class (ConditionalUnet1D) — confirm against the consumer.
type: unet
architecture: ConditionalUnet1D
  
# UNet-specific parameters.
# The `${...}` values are references to entries defined elsewhere in the
# configuration (this looks like OmegaConf/Hydra-style interpolation — TODO
# confirm against the loader), so the dimensions below are not fixed here.
unet:
  # Input and output dimensions both reference the same key
  # (env.dataset.action_dim), so they resolve to the same value.
  input_dim: ${env.dataset.action_dim}
  output_dim: ${env.dataset.action_dim}
  # Resolved from env.dataset.vision_feature_dim; presumably the size of the
  # global conditioning input fed to the network — verify against the model.
  global_cond_dim: ${env.dataset.vision_feature_dim}
  # NOTE(review): how hidden_size, num_blocks, num_layers_per_block and
  # use_attention map onto the network is decided by the model code, which is
  # not visible from this file.
  hidden_size: 256
  num_blocks: 4
  num_layers_per_block: 2
  use_attention: true
  
# Conditioning encoding settings.
conditioning:
  use_vision_encoder: true  # enabled by default; can be overridden by the environment config
  vision_encoder_type: resnet18
  # NOTE(review): presumably replaces BatchNorm layers with GroupNorm in the
  # vision encoder — confirm against the encoder construction code.
  replace_bn_with_gn: true
