# @package _global_
# Defaults list: replaces the selected option of the `pipeline` and `model`
# config groups for this experiment (Hydra-style `override /group: option`).
defaults:
  - override /pipeline: cifar
  - override /model: s3
  # Disabled overrides, kept for reference; they have no effect while
  # commented out.
  # - override /optimizer: adamw
  # - override /callbacks:
  #   - base

# Data-loader settings for this experiment.
loader:
  # presumably the number of samples per batch — confirm against the loader
  batch_size: 50
# Overrides applied on top of the model option chosen in `defaults` (s3).
# NOTE(review): the meaning of each key is defined by that model config,
# which is not visible from this file.
model:
  dropout: 0.25
  n_layers: 6
  d_model: 1024

# Optimizer
# optimizer: adamw
optimizer:
  # Written as a plain decimal (same value as 1e-2): an exponent literal
  # without a dot is loaded as a string by YAML 1.1 loaders such as PyYAML.
  lr: 0.01
  weight_decay: 0.01
# model.layer.0.lr.dt: 1e-3

# Scheduler
trainer:
  # Upper bound on training epochs (presumably passed to the trainer —
  # confirm).
  max_epochs: 200
# scheduler: cosine_warmup
train:
  # presumably the random seed for the run — confirm against the consumer
  seed: 1111
  # Disabled scheduler settings, kept for reference.
  # NOTE(review): uncommenting the three lines below verbatim is not valid
  # YAML — `scheduler: plateau` is a scalar and cannot also hold nested keys.
  # scheduler: plateau
  #   num_warmup_steps: 1000
  #   num_training_steps: 400000
