seed_everything: 0
trainer:
  accelerator: gpu
  strategy: ddp_find_unused_parameters_true
  devices: 4
  num_nodes: 1
  precision: 16-mixed
  logger:
    class_path: lightning.pytorch.loggers.WandbLogger
    init_args:
      save_dir: "vq_log/simvq_1k" #Please specify your own path
      project: "simvq"
      name: "simvq_128_B"
  callbacks:
  - class_path: lightning.pytorch.callbacks.ModelCheckpoint
    init_args:
      dirpath: vq_log/simvq_262k
      filename: null
      monitor: null
      verbose: false
      save_last: null
      save_top_k: -1
      save_weights_only: false
      mode: min
      auto_insert_metric_name: true
      every_n_train_steps: null
      train_time_interval: null
      every_n_epochs: null
      save_on_train_epoch_end: null
      enable_version_counter: true
  - class_path: lightning.pytorch.callbacks.LearningRateMonitor
    init_args:
      logging_interval: step
      log_momentum: false
      log_weight_decay: false
  fast_dev_run: false
  max_epochs: 50
  min_epochs: null
  max_steps: -1
  min_steps: null
  max_time: null
  limit_train_batches: null
  limit_val_batches: null
  limit_test_batches: null
  limit_predict_batches: null
  overfit_batches: 0.0
  val_check_interval: null
  check_val_every_n_epoch: 1
  num_sanity_val_steps: 0
  log_every_n_steps: 100
  enable_checkpointing: null
  enable_progress_bar: null
  enable_model_summary: null
  accumulate_grad_batches: 1
  gradient_clip_val: null
  gradient_clip_algorithm: null
  deterministic: null
  benchmark: null
  inference_mode: true
  use_distributed_sampler: true
  profiler: null
  detect_anomaly: false
  barebones: false
  plugins: null
  sync_batchnorm: false
  reload_dataloaders_every_n_epochs: 0
  default_root_dir: null
ckpt_path: null
model:
  class_path: taming.models.vq.VQModel
  init_args:
    ddconfig:
      double_z: false
      z_channels: 128
      resolution: 128
      in_channels: 3
      out_ch: 3
      ch: 128
      ch_mult:
      - 1
      - 2
      - 2
      - 4
      num_res_blocks: 2
      norm_type: "groupnorm"  # Options: "batchnorm", "layernorm", "instancenorm", "groupnorm"
      norm_groups: 32  # Number of groups for GroupNorm (only used when norm_type="groupnorm")
    lossconfig:
      target: taming.modules.losses.vqperceptual.VQLPIPSWithDiscriminator
      params:
        disc_conditional: false
        disc_in_channels: 3
        disc_start: 0
        disc_weight: 0.8
        gen_loss_weight: 0.1
        codebook_weight: 0.1
        commit_weight: 1.0
        codebook_enlarge_ratio: 0
        codebook_enlarge_steps: 2000
    quantconfig:
      target: taming.modules.vqvae.simvq.VQ
      params:
        n_e: 16384
        e_dim: 128
        beta: 0.25
        legacy: false
        embedding_init: "gaussian"
        l2_norm: false  # Whether to use L2 normalization on codebook and input
        num_groups: 1  # Number of groups for disentanglement loss (only used when disentangle_loss_type="codebook" or "z_q")
        disentangle_loss_type: "codebook_orth"  # Options: "codebook", "z_q", "codebook_orth", "z_q_orth"
        disentangle_loss_weight: 0.0  # Weight for disentanglement loss
        inner_loss_weight: 0.0  # Weight for inner-group variance loss (only used when num_groups > 1)
    ckpt_path: null
    ignore_keys: []
    image_key: image
    colorize_nlabels: null
    monitor: null
    learning_rate: 0.0001
    warmup_epochs: 1.0
    scheduler_type: None
    min_learning_rate: 0
    use_ema: true
    stage: null
    log_image_every_n_steps: 1
    no_vq: true
data:
  class_path: main.DataModuleFromConfig
  init_args:
    batch_size: 64
    train:
      target: taming.data.imagenet.ImageNetTrain
      params:
        config:
          size: 128
          subset: null
    validation:
      target: taming.data.imagenet.ImageNetValidation
      params:
        config:
          size: 128
          subset: null
    test:
      target: taming.data.imagenet.ImageNetValidation
      params:
        config:
          size: 128
          subset: null
    wrap: false
    num_workers: 8