# Autoencoder section: the class named by `target` plus the settings
# listed under `params`.
model:
  base_learning_rate: 2.5e-6
  target: ldm.models.autoencoder.AutoencoderKL
  params:
    monitor: 'val/rec_loss'
    # Same value as ddconfig.z_channels below (8).
    embed_dim: 8
    use1d: true
    use_one_embedding: true
    mixup_prob: 0.8

    # Loss section: its own `target` class and `params`.
    lossconfig:
      target: ldm.modules.losses.LPIPSLoss
      params:
        # NOTE(review): presumably the step at which the discriminator
        # term is switched on — confirm against the loss class.
        disc_start: 50001
        kl_weight: 0.000001
        disc_weight: 0.5
        disc_in_channels: 1
        # The perceptual term is given zero weight here.
        perceptual_weight: 0.0

    # Encoder/decoder section: one input channel, one output channel.
    ddconfig:
      double_z: true
      z_channels: 8
      resolution: 2048
      in_channels: 1
      out_ch: 1
      ch: 128
      ch_mult: [1, 1, 1, 1, 2, 2, 2, 2]  # num_down = len(ch_mult)-1
      num_res_blocks: 2
      attn_resolutions: []
      dropout: 0.0
      # use_linear_attn: True
      # Quoted so it reads unmistakably as the string "none", not a null.
      attn_type: 'none'

# Data section: the module named by `target`, its `params`, and a nested
# `trainer` mapping.
data:
  target: main.DataModuleFromConfig
  params:
    batch_size: 34
    num_workers: 2
    wrap: true
    # Training split (is_train: true).
    train:
      target: ldm.data.metadiff.load_data
      params:
        data_dir: merged_sub_ctx_values_dict.pt
        dataset_mode: coop
        image_size: 2048
        is_train: true
        coprompt: true
    # Validation split: same loader, file, and options as `train`, except
    # is_train is false.
    validation:
      target: ldm.data.metadiff.load_data
      params:
        data_dir: merged_sub_ctx_values_dict.pt
        dataset_mode: coop
        image_size: 2048
        is_train: false
        coprompt: true

  # NOTE(review): at this indentation `trainer` is a child of `data`, not a
  # top-level section. If the training script looks for trainer settings
  # elsewhere (e.g. under a top-level `lightning:` key), these values are
  # silently ignored — confirm against the script that loads this file.
  trainer:
    benchmark: true
    # accumulate_grad_batches: 2
    epochs: 30000
    log_every_n_steps: 10
    find_unused_parameters: false

