# @package _global_

defaults:
  - override /data: imagenet32
  - override /task/optimizer: adamw
  - override /task/lr_scheduler: cosine
  - override /task/model: bsi/dit

hydra:
  sweeper:
    params:
      seed: 9551795317880672191,6416273688357815109,1220563347313811177
      task: vdm,bfn,bsi

seed: ~
eval_testset: yes

name: ${task.name}-${task.model.name}
title: bsi-${data.name}

data:
  batch_size: 512
  eval_batch_size: 512

task:
  compile: yes
  optimizer:
    lr: 5e-4
    betas: [0.9, 0.99]
    weight_decay: 1e-2
  lr_scheduler:
    end_lr: 5e-5
  model:
    name: DiT-L-2
    patch_size: 2
    dim: 1024
    depth: 24
    heads: 16
    dropout: 0.05

trainer:
  precision: "32"

  max_steps: 1000000
  val_check_interval: 100000
