# Smallest preset in this file (dim 16, 2 heads, depth 1).
# Presumably intended for fast smoke tests / debugging — confirm with the consumer.
# dim is evenly divisible by num_attn_heads (16 / 2 = 8).
debug:
  dim: 16
  num_attn_heads: 2
  depth: 1

# 5.5M — presumably the approximate parameter count; TODO confirm how it was measured.
# dim is evenly divisible by num_attn_heads (192 / 3 = 64).
tiny:  # vit_tiny_patch16_224 (looks like the reference model name — verify)
  dim: 192
  num_attn_heads: 3
  depth: 12

# 21.5M — presumably the approximate parameter count; TODO confirm how it was measured.
# dim is evenly divisible by num_attn_heads (384 / 6 = 64).
small:  # vit_small_patch16_224 (looks like the reference model name — verify)
  dim: 384
  num_attn_heads: 6
  depth: 12

# 85.6M — presumably the approximate parameter count; TODO confirm how it was measured.
# dim is evenly divisible by num_attn_heads (768 / 12 = 64).
base:
  dim: 768
  num_attn_heads: 12
  depth: 12

# 303M — presumably the approximate parameter count; TODO confirm how it was measured.
# dim is evenly divisible by num_attn_heads (1024 / 16 = 64).
large:
  dim: 1024
  num_attn_heads: 16
  depth: 24

# 630M — presumably the approximate parameter count; TODO confirm how it was measured.
# dim is evenly divisible by num_attn_heads (1280 / 16 = 80); note the quotient
# is 80 here, whereas the tiny/small/base/large presets all give 64.
huge:
  dim: 1280
  num_attn_heads: 16
  depth: 32
