# Model Configuration
wandb:
  entity: null
#  run_id: askkz9i2
  resume: 'auto'
model:
  pretrained_model_name_or_path: ""
  pretrained_model_name_or_path_con: "checkpoints/magvitv2"
  stage1:
    pretrained_model: ''
    discriminator_config_name_or_path: ''
    discriminator3d_config_name_or_path: ''
  model_config_name_or_path: null
  discriminator_config_name_or_path: null
  model_type: "ctx_vqgan"  # Options: ['vqgan', 'ctx_vqgan']
  use_ema: true #false
  enable_xformers_memory_efficient_attention: false
  disc_depth: 4
  selected_params: false
  weighted_mse: null
  weighted_gan: false
  latest_checkpoint_only: false
  context_model_train: true #false
  dynamic_model_train: true #false
  cond_enable: true #false
  maskIM: false
  load_checkpoint: true
  gan_check_point: ""
  disc_check_point: ""

  vq_model:
    type: "magvitv2"
    latent_size: 4
    patch_size: 2

# Data Configuration
dataset:
  gen_type: "OpenDV"
  video_root:
    opendv: '/dataset'
    opendvmini: '/OPendvmini'

  json_root: 'dataset'
  dataset_use: 'Tokenizer_TRAINGIN'
  mix_data:
     'OPENDV_MINI': 'opendvmini'
     'OPENDV_FULL': 'opendv'
  params:
    dataset_size: null
    cache_dir: null
    video_stepsize: 1
    rand_select: true
    use_datasets: false
    segment_length: 11
    context_length: 2 #2
    segment_horizon: 30
    strong_aug: false
    no_aug: false
    skip_first_val: false
    resolution_h: 128 #256
    resolution_w: 224 #448
    Con_resolution_h: 256
    Con_resolution_w: 448
    resolution: [128, 224] #[256,448]
    oxe_data_mixes_type: "debug"

optimizer:
  name: adamw
  params:
    adam_beta1: 0.9
    adam_beta2: 0.999
    adam_weight_decay: 0.0
    adam_epsilon: 1e-08
    start_global_step: 0
    discr_learning_rate: 1e-4
    learning_rate: 2e-4
    scale_lr: false
    lr_scheduler: "cosine"  # Options: ['linear', 'cosine', 'cosine_with_restarts', 'polynomial', 'constant', 'constant_with_warmup']
    discr_lr_scheduler: "constant_with_warmup"
    max_grad_norm: 10.0

# Training Configuration
training:
  name: 'cx_magvit-v2'
  seed: 0
  train_batch_size: 2 #4
  val_batch_size: 24 #24
  num_train_epochs: 500
  lr_warmup_steps: 500
  max_train_steps: 1000000
  gradient_accumulation_steps: 4
  gradient_checkpointing: false
  use_8bit_adam: false
  allow_tf32: false
  dataloader_num_workers: 8
  log_grad_norm_steps: 50000
  log_steps: 100
  validation_steps: 5000
  log_image_steps: 200
  logging_dir: "logs"
  report_to: "tensorboard"  # Options: ['tensorboard', 'wandb', 'comet_ml', 'all']
  tracker_project_name: "vqgan-training"
  vae_loss: "l1"
  checkpointing_steps: 10000
  resume_from_checkpoint: null
  mixed_precision: "bf16"
  selected_params: true
  balanced_loss: false
  perc_weight: 2.0
  recon_weight: 5.0
  Commitment loss weight: 0.5
  Entropy loss weight: 1
  disc_start: 0
  disc_weight: 1
  dy_epy_weight: 5
  skip_first_val: true #false
  num_workers: 4
  start_global_step: 0
  stage: 1
  recon_min_weight: 1e-5
  save_check_start: 5000
# Output and Experiment Configuration
output:
  output_dir: "resume_checkpoint/vqgan_stage"
  exp_name: "vq_LR_2e-4_80w_step_2x"
