# Settings under DATALOADER: one BATCH_SIZE for each of TRAIN_X and TEST,
# plus a NUM_WORKERS value set at the DATALOADER level.
# NOTE(review): the upper-case nested keys look like a yacs-style config
# node; confirm against the loader that consumes this file.
DATALOADER:
  # NOTE(review): presumably the labeled training split; confirm.
  TRAIN_X:
    BATCH_SIZE: 60
  TEST:
    BATCH_SIZE: 100
  # Sibling of TRAIN_X/TEST, so it is not scoped to a single split here.
  # NOTE(review): presumably the number of loader worker processes; confirm.
  NUM_WORKERS: 8

# Top-level model scalars, siblings of vision_cfg and text_cfg.
# NOTE(review): this key layout (embed_dim, quick_gelu, vision_cfg, text_cfg)
# resembles an open_clip model config; confirm which loader reads it.
embed_dim: 1024
# Written as a real YAML boolean, not a quoted string.
quick_gelu: true
# Settings for the vision side of the model.
vision_cfg:
  image_size: 224
  layers: 32
  width: 1280
  # 1280 / 80 = 16.
  # NOTE(review): presumably width / head_width gives the head count; confirm.
  head_width: 80
  # 224 / 14 = 16, so image_size is an exact multiple of patch_size.
  patch_size: 14
# Settings for the text side of the model.
text_cfg:
  context_length: 77
  vocab_size: 49408
  width: 1024
  # Given as a head count here, whereas vision_cfg gives head_width instead.
  # 1024 / 16 = 64.
  heads: 16
  layers: 24
