flux_path: "black-forest-labs/FLUX.1-dev"
dtype: "bfloat16"

model:
  independent_condition: false

train:
  accumulate_grad_batches: 1
  dataloader_workers: 5
  save_interval: 1000
  sample_interval: 100
  max_steps: -1
  gradient_checkpointing: true # (Turn off for faster training)
  save_path: "runs"

  # 使用三个条件：subject + position + background
  condition_type: "subject_position_background"
  dataset:
    type: "subject_position_background"
    condition_size:
      - 512
      - 512
    target_size: 
      - 512
      - 512
    image_size: 512
    padding: 8
    
    # Dropout 概率（用于 Classifier-Free Guidance 训练）
    drop_text_prob: 0.1          # 文本 dropout
    drop_subject_prob: 0       # Subject 参考图 dropout
    drop_position_prob: 0      # Position mask dropout
    drop_background_prob: 0    # Background 图像 dropout
    
    # Fill mask 生成参数
    min_mask_ratio: 0         # 遮挡区域最小占比（图像面积的 15%）
    max_mask_ratio: 0.6          # 遮挡区域最大占比（图像面积的 60%）
    
    # Background 生成参数
    background_blur_prob: 0.3    # 背景模糊概率（30%）
    
    # 可选：使用外部背景数据集
    use_external_background: false  # 设为 true 启用外部背景
    background_urls:
      # (取消注释以使用 text-to-image-2M 作为背景源)
      # - "https://huggingface.co/datasets/jackyhate/text-to-image-2M/resolve/main/data_512_2M/data_000045.tar"
      # - "https://huggingface.co/datasets/jackyhate/text-to-image-2M/resolve/main/data_512_2M/data_000046.tar"

  wandb:
    project: "OminiControl"
    name: "triple_condition_control"

  lora_config:
    r: 16
    lora_alpha: 16
    init_lora_weights: "gaussian"
    target_modules: "(.*x_embedder|.*(?<!single_)transformer_blocks\\.[0-9]+\\.norm1\\.linear|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_k|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_q|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_v|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_out\\.0|.*(?<!single_)transformer_blocks\\.[0-9]+\\.ff\\.net\\.2|.*single_transformer_blocks\\.[0-9]+\\.norm\\.linear|.*single_transformer_blocks\\.[0-9]+\\.proj_mlp|.*single_transformer_blocks\\.[0-9]+\\.proj_out|.*single_transformer_blocks\\.[0-9]+\\.attn.to_k|.*single_transformer_blocks\\.[0-9]+\\.attn.to_q|.*single_transformer_blocks\\.[0-9]+\\.attn.to_v|.*single_transformer_blocks\\.[0-9]+\\.attn.to_out)"

  optimizer:
    type: "Prodigy"
    params:
      lr: 1
      use_bias_correction: true
      safeguard_warmup: true
      weight_decay: 0.01
