# Configuration for the agent class named by `_target_`. Values written as
# `${...}` are interpolations resolved from other keys in the composed config.
method:
  _target_: robobase.method.act.ActBCAgent
  is_rl: false
  # Interpolated from a root-level `device` key defined outside this section.
  device: ${device}
  # Floats carry an explicit mantissa dot: YAML 1.1 loaders such as plain
  # PyYAML read a bare `1e-4` as a string, while `1.0e-4` is a float for
  # every loader.
  lr: 1.0e-4
  # Also consumed by `encoder_model.lr_backbone` through interpolation.
  lr_backbone: 1.0e-5
  weight_decay: 1.0e-4
  # Interpolated from a root-level `num_pretrain_steps` key defined outside
  # this section.
  num_train_steps: ${num_pretrain_steps}
  adaptive_lr: false
  actor_grad_clip: null
  # Shared flag: `actor_model.use_lang_cond` and `encoder_model.use_lang_cond`
  # both interpolate this value, so change it here only.
  use_lang_cond: false

  # Settings for the actor network class named by `_target_`.
  actor_model:
    _target_: robobase.method.act.MultiViewTransformerEncoderDecoderACT
    # With `_partial_: true`, Hydra's `instantiate` returns a partial of the
    # target instead of calling it, so remaining arguments can be supplied
    # later by the caller.
    _partial_: true

    # Mandatory values: `???` has no default and must be filled in before
    # the value is read.
    input_shape: ???
    state_dim: ???
    action_dim: ???

    # Values resolved from other parts of the config.
    num_queries: ${action_sequence}
    use_lang_cond: ${method.use_lang_cond}

    # Fixed hyperparameters. `hidden_dim` is also read by
    # `encoder_model.hidden_dim` through interpolation.
    hidden_dim: 512
    nheads: 8
    enc_layers: 4
    dec_layers: 1
    dim_feedforward: 3200
    dropout: 0.1
    pre_norm: false

  # Settings for the image encoder class named by `_target_`.
  encoder_model:
    _target_: robobase.method.act.ImageEncoderACT
    # With `_partial_: true`, Hydra's `instantiate` returns a partial of the
    # target instead of calling it.
    _partial_: true
    # `???` marks a mandatory value with no default in this file.
    input_shape: ???
    # Follows the actor's `hidden_dim` via interpolation, so the two stay
    # equal.
    hidden_dim: ${method.actor_model.hidden_dim}
    position_embedding: "sine"
    # Follows `method.lr_backbone` via interpolation.
    lr_backbone: ${method.lr_backbone}
    masks: false
    backbone: "resnet18"
    dilation: false
    # Follows the shared `method.use_lang_cond` flag.
    use_lang_cond: ${method.use_lang_cond}
