---
# Data pipeline settings: batching, dataset selection, and normalization.
data:
  batch_size: 4
  dataset:
    # Placeholder path; replace with the real dataset location.
    data_dir: '/path/to/data'
    delta_t: 1
    downsample: 1
    # NOTE(review): -1 presumably means "use every available trajectory";
    # confirm against the dataset loader.
    num_testing_trajs: -1
    num_training_trajs: -1
    start_time: 0
    # Same value (48) as the leading entry of the first-stage autoencoder
    # `resolution` lists under `model` -- presumably they must agree; confirm.
    trajlen: 48
    use_embed: false
  drop_last: true
  mode: 'ns2D'
  normalizer:
    scaler: 'normal'
    # Placeholder path; replace with the real normalization statistics.
    stat_path: '/path/to/normalizer/stats'
    use_norm: true
  num_workers: 16
# Placeholder path. NOTE(review): presumably the directory read at evaluation
# time; confirm against the consuming script.
load_dir: '/path/to/eval/dir'
# Model settings: top-level diffusion hyperparameters plus three nested
# sub-configs (cond_stage_config, first_stage_config, model_config).
model:
  base_learning_rate: 1.0e-05
  beta_schedule: 'linear'
  # Same value (16) as `model_config.in_channels` and the autoencoder
  # `z_channels` below.
  channels: 16
  clip_denoised: false

  # Conditioning stage: a 2-D encoder (`dim: 2`) over 128 x 128 inputs.
  cond_stage_config:
    conditional: true
    encoder:
      attn_resolutions: [16]
      ch_mult: [1, 2, 4, 4]
      cond_channels: 128
      dim: 2
      double_z: false
      dropout: 0.0
      hidden_channels: 128
      in_channels: 3
      num_res_blocks: 2
      out_channels: 512
      resolution: [128, 128]
      tanh_out: false
      z_channels: 512
    # Same value (512) as `model_config.context_dim` below.
    out_dim: 512
    pretrained: false
    use_fourier: true
  cond_stage_trainable: true
  cosine_s: 0.008
  dist: true

  # First stage: autoencoder with mirrored decoder/encoder settings
  # (3 <-> 16 channels, resolution 48 x 128 x 128).
  first_stage_config:
    aeconfig:
      decoder:
        attn_resolutions: [16]
        ch_mult: [1, 2, 4, 4]
        cond_channels: 1
        double_z: true
        dropout: 0.0
        hidden_channels: 64
        in_channels: 16
        num_res_blocks: 2
        out_channels: 3
        resolution: [48, 128, 128]
        tanh_out: false
        z_channels: 16
      encoder:
        attn_resolutions: [16]
        ch_mult: [1, 2, 4, 4]
        cond_channels: 1
        double_z: true
        dropout: 0.0
        hidden_channels: 64
        in_channels: 3
        num_res_blocks: 2
        out_channels: 16
        resolution: [48, 128, 128]
        tanh_out: false
        z_channels: 16
    lossconfig:
      kl_weight: 2.0e-07
    # Placeholder path; replace with the real autoencoder checkpoint.
    pretrained_path: '/path/to/pretrained/autoencoder'
    training:
      dist: true

  # Same value as `model_config.input_size` below.
  image_size: [6, 16, 16]
  # NOTE(review): presumably the endpoints of the linear beta schedule
  # selected by `beta_schedule`; confirm.
  linear_end: 0.012
  linear_start: 0.00085
  log_every_t: 200

  # NOTE(review): presumably the denoising backbone (the wandb run name
  # mentions "DiT"); confirm against the model code.
  model_config:
    context_dim: 512
    depth: 28
    dim: 3
    hidden_size: 1024
    in_channels: 16
    input_size: [6, 16, 16]
    learn_sigma: false
    mlp_ratio: 4.0
    num_heads: 16
    patch_size: [1, 2, 2]
    use_cross_attn: true

  monitor: 'val/loss'
  num_timesteps_cond: 1
  parameterization: 'eps'
  scale_factor: 0.2
  scheduler_config:
    scheduler: 'cosine'
  timesteps: 1000
# Placeholder path. NOTE(review): presumably the checkpoint of the model to
# evaluate; confirm against the consuming script.
model_path: '/path/to/model/to/eval'
# Training-run settings.
# NOTE(review): several keys share names with PyTorch Lightning Trainer
# arguments and are presumably forwarded to it; confirm in the training script.
training:
  accelerator: 'gpu'
  accumulate_grad_batches: 1
  check_val_every_n_epoch: 10
  # No checkpoint configured (explicit null).
  checkpoint: null
  dataset_size: 2496
  default_root_dir: 'logs/'
  devices: 1
  # Explicit null. NOTE(review): presumably disables EMA; confirm.
  ema_decay: null
  ema_every_n_steps: 1
  gradient_clip_val: 1.0
  limit_train_batches: 300
  limit_val_batches: 70
  log_every_n_steps: 32
  max_epochs: 1000
  seed: 42
  strategy: 'auto'
# Weights & Biases settings: run name and project name.
wandb:
  name: 'LDM_NS2D_DiT_FF'
  project: 'ldm_diffusion'
