# Data-loading settings. Both splits below use the same batch size (100).
# NOTE(review): the upper-case key layout looks like a Dassl/yacs-style
# config node - confirm against the code that loads this file.
DATALOADER:
  # Settings for the TRAIN_X split (presumably the labeled training set -
  # TODO confirm with the consumer).
  TRAIN_X:
    BATCH_SIZE: 100
  # Settings for the TEST split.
  TEST:
    BATCH_SIZE: 100
  # Presumably the number of data-loading worker processes - verify how the
  # loader interprets this value.
  NUM_WORKERS: 8

# Top-level model settings.
# NOTE(review): presumably the size of the embedding shared by the vision and
# text branches - confirm against the model-building code.
embed_dim: 768
# NOTE(review): presumably selects the "QuickGELU" activation variant rather
# than the standard GELU - confirm against the consumer.
quick_gelu: true
# Vision (image) branch settings.
vision_cfg:
  # 224 is an exact multiple of patch_size: 224 / 14 = 16.
  image_size: 224
  layers: 24
  width: 1024
  # head_width must divide width evenly: 1024 / 64 = 16 heads. A value such
  # as 80 does not divide 1024 (1024 / 80 = 12.8), which yields an invalid
  # head count when heads are derived as width // head_width.
  # NOTE(review): assumes the consumer derives the head count this way (as
  # open_clip does) - confirm.
  head_width: 64
  patch_size: 14
# Text branch settings.
text_cfg:
  # NOTE(review): presumably the maximum number of tokens per input text -
  # confirm against the tokenizer in use.
  context_length: 77
  # NOTE(review): presumably the tokenizer vocabulary size - must match the
  # tokenizer used by the consumer; verify.
  vocab_size: 49408
  # width divides evenly by heads: 768 / 12 = 64 per head.
  width: 768
  heads: 12
  layers: 12
