# @package _global_   

# Hydra defaults list. Entries are composed in the order listed; `_self_`
# (this file) comes first, so the selected `dataset` config is merged after
# it and wins on any overlapping keys.
defaults:
  - _self_
  - dataset: coco256_features

# Experiment name plus the output and logging directory names.
exp_name: 'GM-MMDiT-REPA-ConTr-1.0-1.0-scratch'
output_dir: 'exps'
logging_dir: 'logs'

# Seed value and TF32 toggle.
seed: 42
allow_tf32: true

# Settings grouped under `t2i`.
# NOTE(review): how each key is consumed is not visible in this file —
# confirm meanings against the code that reads this config.
t2i:
  resolution: 256

  # Encoder selection: type identifier, path, and depth value.
  enc_type: 'dinov2-vit-b'
  enc_path: '***************************'
  encoder_depth: 8

  # Coefficients; `attn_coeff` is set to 0.0 in this experiment.
  proj_coeff: 0.5
  attn_coeff: 0.0

  prob_path: 'CondOT'
  weighting: 'uniform'
  early_stop_point: 75000

  # A pretrained path is set here; the disabled alternative is `null`.
  # pretrained_model_path: null
  pretrained_model_path: '***********************'

# Settings grouped under `i2t`.
# NOTE(review): how each key is consumed is not visible in this file —
# confirm meanings against the code that reads this config.
i2t:
  clip_path: '***************************'
  prob_path: 'PolynomialDiscrete'
  prob_path_exp: 1.0

  # Choices: [uniform, masked]
  p0_dist: 'uniform'

  # Choices: [cross_entropy, generalized_kl]
  loss: 'generalized_kl'

  # No pretrained path is set (null); the disabled alternative is a path.
  pretrained_model_path: null
  # pretrained_model_path: '***************************'

  # Values grouped under `params`.
  params:
    hidden_size: 768
    cond_dim: 128
    length: 128
    n_blocks: 24
    n_heads: 12
    dropout: 0.1
    compile: true
  
# Settings grouped under `training`: loss weights, learning rates, Adam
# hyperparameters, and step/epoch limits.
training:
  image_loss_weight: 1.0
  text_loss_weight: 1.0
  cfg_prob: 0.1

  # Scientific-notation floats are written with an explicit decimal point in
  # the mantissa (`1.0e-4`, not `1e-4`). YAML 1.1 resolvers such as PyYAML's
  # load the dot-less form as a string; the dotted form is a float under
  # every loader and has the same numeric value.
  t2i_learning_rate: 1.0e-4
  i2t_learning_rate: 1.0e-4
  adam_beta1: 0.9
  adam_beta2: 0.999
  adam_weight_decay: 1.0e-5
  adam_epsilon: 1.0e-8

  max_train_steps: 250000
  epochs: 1000
  max_grad_norm: 1.0

  # NOTE(review): 200 is small next to `max_train_steps` (250000) — confirm
  # this value is intended.
  checkpointing_steps: 200

  prompt_prob: 0.0
  text_guidance_prob: 0.1

# Settings grouped under `sampling`.
sampling:
  # NOTE(review): `sampling_steps` and `num_steps` hold the same value; which
  # consumer reads each one is not visible here — confirm both are needed.
  sampling_steps: 200
  num_steps: 200

  cfg_scale: 3.0
  guidance_low: 0.0
  guidance_high: 1.0
  pproc_batch_size: 32

  # 40192 for coco
  n_samples: 4096
  extra_text_steps: 1

# Settings grouped under `accelerator`.
accelerator:
  gradient_accumulation_steps: 1

  # Choices: [no, fp16, bf16]
  mixed_precision: 'bf16'

  report_to: 'wandb'

# Resume step and checkpoint directory.
# NOTE(review): `resume_step` equals `training.max_train_steps` (250000) —
# confirm this is intended.
resume_step: 250000
ckpt_dir: '***************************'