# Experiment identity. `name` and `version` are reused further down in this
# file through ${name} / ${version} interpolation.
name: lgm-v1
tags:
  - svd
description: ""
# If not specified, will be set to version_{index}.
version: "128_sigmoid scale 0 - 8"
output_dir: "outputs/${name}"

# Shared values. The `data` section reads resolution, bg_color, root_dir and
# instance_file from here through ${extras.*} interpolation.
extras:
  resolution: 512
  # src_views / target_views are not interpolated anywhere in the visible
  # config — presumably read directly by code; TODO confirm.
  src_views: 1
  target_views: 6
  bg_color: white
  root_dir: data/gobjaverse/data
  instance_file: data/gobjaverse/gobjaverse_280k_Food.json

# Seed value; how it is applied is decided by the training entry point,
# which is not visible in this file.
seed: 42
# Disabled: uncomment to set `resume` to an existing checkpoint path.
# resume: outputs/3dgs-fix/p0gao83a/checkpoints/epoch=189-step=19000.ckpt
# Data module configuration. The train, val and test splits all use the same
# dataset class and the same shared values from `extras`; only the train
# split sets `repeat`.
# NOTE(review): val and test read the same instance_file as train — confirm
# this is intended.
data:
  _target_: src.data.gobjaverse.MultiViewDataModule
  train_dataset:
    _target_: src.data.gobjaverse.MultiViewDataset
    root_dir: ${extras.root_dir}
    instance_file: ${extras.instance_file}
    bg_color: ${extras.bg_color}
    # Both entries resolve to extras.resolution (square images).
    img_wh:
      - ${extras.resolution}
      - ${extras.resolution}
    num_samples: 1
    repeat: 100
  train_batch_size: 1
  val_dataset:
    _target_: src.data.gobjaverse.MultiViewDataset
    root_dir: ${extras.root_dir}
    instance_file: ${extras.instance_file}
    bg_color: ${extras.bg_color}
    img_wh:
      - ${extras.resolution}
      - ${extras.resolution}
    num_samples: 1
  val_batch_size: 1
  test_dataset:
    _target_: src.data.gobjaverse.MultiViewDataset
    root_dir: ${extras.root_dir}
    instance_file: ${extras.instance_file}
    bg_color: ${extras.bg_color}
    img_wh:
      - ${extras.resolution}
      - ${extras.resolution}
    num_samples: 1
  test_batch_size: 1
  num_workers: 32
  pin_memory: true


# Training system configuration: the system class, its optimisation settings,
# a multi-view model (`mv_model`) and a reconstruction model (`recon_model`).
# Class paths are given by the `_target_` entries.
system:
  _target_: src.systems.mv_diffusion.lgm_system.SVDSystem
  lr: 1.0e-5
  base_model_id: stabilityai/stable-video-diffusion-img2vid
  variant: fp16
  cfg: 0.1
  mv_model:
    _target_: src.models.unet.mv_unet.MVModel
    cond_encoder:
      _target_: src.models.unet.adaptor.Adapter_XL
      cin: 768
      sk: true
    # Applies to mv_model as a whole. With Hydra's instantiate, `_partial_`
    # yields a partially-applied constructor instead of a built object.
    _partial_: true

  recon_model:
    _target_: src.models.network.lgm.fix_model.LGM
    opt:
      _target_: src.models.network.lgm.options.Options
      input_size: 256
      up_channels: [1024, 1024, 512, 256, 128]
      up_attention: [true, true, true, false, false]
      splat_size: 128
      output_size: 512
      batch_size: 8
      # NOTE(review): 8 here, while `extras` declares src_views: 1 and
      # target_views: 6 — confirm these are meant to differ.
      num_views: 8
      gradient_accumulation_steps: 1
      mixed_precision: fp16



# Keyword arguments for lightning.pytorch.trainer.Trainer.
trainer:
  _target_: lightning.pytorch.trainer.Trainer
  default_root_dir: ${output_dir}

  # Schedule, validation cadence and logging
  max_steps: 100000
  check_val_every_n_epoch: 2
  log_every_n_steps: 10
  num_sanity_val_steps: 1
  enable_progress_bar: true

  # Hardware layout
  strategy: "auto"
  accelerator: "gpu"
  devices: 1
  num_nodes: 1

  # Numerics (quoted so the number-leading value is unambiguously a string)
  precision: "16-mixed"
  gradient_clip_val: 1.0

# Callbacks, keyed by name. Only model_checkpoint is active; the entries kept
# as comments below are disabled.
callbacks:
  model_checkpoint:
    _target_: lightning.pytorch.callbacks.ModelCheckpoint
    # -1 keeps every saved checkpoint (per Lightning's ModelCheckpoint docs).
    save_top_k: -1
    every_n_train_steps: 20000
  # point_cloud_checkpoint:
  #   _target_: src.utils.callbacks.PointCloudCallback
  # rich_progress_bar:
  #   _target_: lightning.pytorch.callbacks.RichProgressBar

# Loggers, keyed by name. wandb is active; the tensorboard entry kept as
# comments below is disabled.
logger:
  # tensorboard:
  #   _target_: lightning.pytorch.loggers.tensorboard.TensorBoardLogger
  #   save_dir: "${output_dir}"
  #   name: ""
  #   version: "${version}"
  #   sub_dir: "tb_logs"
  wandb:
    _target_: lightning.pytorch.loggers.wandb.WandbLogger
    project: "${name}"
    # NOTE(review): literal "outputs", whereas the disabled tensorboard entry
    # uses "${output_dir}" — confirm this difference is intended.
    save_dir: "outputs"
    name: "${version}"
    # Disabled options, presumably for resuming an existing wandb run:
    # id: p0gao83a
    # resume: 'must'