optimizer :
  type: AdamW
  kwargs:
    lr: 0.0005
    weight_decay: 0.0005


scheduler:
  type: CosLR
  kwargs:
    epochs: 300
    initial_epochs : 10

dataset:
  train:
    _base_: cfgs/dataset_configs/ShapeNet-55.yaml
    others: 
      subset: train
      npoints: 1024
  val:
    _base_: cfgs/dataset_configs/ShapeNet-55.yaml
    others: 
      subset: test
      npoints: 1024
  test:
    _base_: cfgs/dataset_configs/ShapeNet-55.yaml
    others: 
      subset: test
      npoints: 1024


temp:
  start: 1
  target: 0.0625
  ntime: 100000 


kldweight:
  start: 0
  target: 0.1
  ntime: 100000


model:
  NAME: ACTPromptedDiscreteVAEwithVIT
  # NAME: ACTPromptedDiscreteVAEwithBERT # special for BERT
  # ViT
  visual_embed_type: vit_base_patch16_384
  # visual_embed_type: vit_small_patch16_384
  # visual_embed_type: vit_base_r50_s16_224_in21k
  # visual_embed_type: vit_base_r50_s16_384
  # DEiT
  # visual_embed_type: deit_small_distilled_patch16_224
  # visual_embed_type: deit_base_distilled_patch16_384
  # BEiT
  # visual_embed_type: beit_base_patch16_384
  # visual_embed_type: beit_large_patch16_512
  # CLIP
  # visual_embed_type: CLIP:ViT-B/16
  # MLP-Mixer
  # visual_embed_type: mixer_b16_224_in21k
  # visual_embed_type: mixer_b16_224_miil
  # visual_embed_type: resmlp_24_distilled_224
  # BERT:
  # visual_embed_type: 
  # visual_embed_dim: 384
  visual_embed_dim: 768
  visual_embed_pos: after_dgcnn1
  freeze_visual_embed: true
  num_prompt_token: 0
  # num_prompt_token: 132 # especifically for MLP-Mixer with patch size 16
  use_deep_prompt: false
  num_group: 64
  group_size: 32
  num_tokens: 8192
  encoder_dims: 384
  tokens_dims: 384
  decoder_dims: 384


npoints: 1024
total_bs: 64
step_per_update: 1
max_epoch: 300
grad_norm_clip: 10


consider_metric: CDL1
