flux_path: "black-forest-labs/FLUX.1-dev"
dtype: "bfloat16"

model:
  independent_condition: false

train:
  accumulate_grad_batches: 1
  batch_size: 8
  dataloader_workers: 8
  save_interval: 200
  sample_interval: 200
  max_steps: -1
  gradient_checkpointing: True
  save_path: "runs"
  resume_from_checkpoint: null  # 从checkpoint恢复，例如: "runs/20241124-130000/ckpt/1000"
  save_optimizer_state: false    # 是否保存optimizer状态（设为false可节省显存）

  # 航空目标三条件控制（单文件夹）
  condition_type: "aircraft_single_folder"
  dataset:
    type: "aircraft_single_folder"
    
    # 数据集路径（单文件夹，包含 Original, Masks, Background_Erased, Crops）
    dataset_root: "/data2/aaa/datasets/semgen/"
    
    # 图像尺寸
    condition_size:
      - 512
      - 512
    target_size: 
      - 512
      - 512
    
    # Dropout 概率（用于 Classifier-Free Guidance 训练）
    drop_text_prob: 0          # 文本 dropout
    drop_subject_prob: 0       # Subject 参考图 dropout
    drop_position_prob: 0      # Position mask dropout
    drop_background_prob: 0    # Background 图像 dropout
    
    # Fill mask 生成参数
    min_mask_ratio: 0          # 遮挡区域最小占比
    max_mask_ratio: 0.6        # 遮挡区域最大占比
    
    # Background 生成参数
    background_blur_prob: 0  # 背景模糊概率
    
    # 数据增强参数
    augmentation_prob: 0.5     # 应用几何变换的概率
    rotation_prob: 0.5         # 旋转概率
    flip_prob: 0.5             # 翻转概率
    color_jitter_prob: 0.5     # 颜色抖动概率
    brightness_range:
      - 0.8
      - 1.2
    contrast_range:
      - 0.8
      - 1.2
    saturation_range:
      - 0.8
      - 1.2
    hue_range:
      - -0.1
      - 0.1

  wandb:
    project: "OminiControl"
    name: "aircraft_single_folder"

  lora_config:
    r: 16
    lora_alpha: 16
    init_lora_weights: "gaussian"
    target_modules: "(.*x_embedder|.*(?<!single_)transformer_blocks\\.[0-9]+\\.norm1\\.linear|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_k|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_q|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_v|.*(?<!single_)transformer_blocks\\.[0-9]+\\.attn\\.to_out\\.0|.*(?<!single_)transformer_blocks\\.[0-9]+\\.ff\\.net\\.2|.*single_transformer_blocks\\.[0-9]+\\.norm\\.linear|.*single_transformer_blocks\\.[0-9]+\\.proj_mlp|.*single_transformer_blocks\\.[0-9]+\\.proj_out|.*single_transformer_blocks\\.[0-9]+\\.attn.to_k|.*single_transformer_blocks\\.[0-9]+\\.attn.to_q|.*single_transformer_blocks\\.[0-9]+\\.attn.to_v|.*single_transformer_blocks\\.[0-9]+\\.attn.to_out)"

  optimizer:
    type: "Prodigy"
    params:
      lr: 1
      use_bias_correction: true
      safeguard_warmup: true
      weight_decay: 0.01
