# Data-loading settings: loader worker count and per-loader batch sizes.
DATALOADER:
  # Number of loader workers. NOTE(review): presumably shared by every
  # loader built from this section — confirm against the consuming code.
  NUM_WORKERS: 1
  # TRAIN_X loader (presumably the labeled training split — confirm).
  TRAIN_X:
    BATCH_SIZE: 3
  # TEST loader.
  TEST:
    BATCH_SIZE: 1

# Image input / preprocessing settings.
INPUT:
  # NOTE(review): this is a plain scalar, so a YAML parser yields the string
  # "(224, 224)" rather than a sequence. Presumably the config loader
  # evaluates it into a tuple — confirm before changing its form.
  SIZE: (224, 224)
  INTERPOLATION: "bicubic"
  # Three-element mean / std used with the "normalize" transform below.
  # NOTE(review): the values appear to match the preprocessing constants
  # published with OpenAI CLIP (RGB order presumed) — verify.
  PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
  PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
  # Names of the transforms to apply, kept in their original order.
  TRANSFORMS:
    - "random_resized_crop"
    - "random_flip"
    - "normalize"

# Optimizer and learning-rate schedule settings.
OPTIM:
  # Optimizer name and its learning rate.
  NAME: "sgd"
  LR: 0.02
  # Learning-rate scheduler name.
  LR_SCHEDULER: "cosine"
  # Maximum number of training epochs.
  MAX_EPOCH: 100

# Training-loop settings.
TRAIN:
  # Print frequency. NOTE(review): the unit (presumably batches/iterations)
  # is not visible in this file — confirm against the trainer.
  PRINT_FREQ: 50

# Model selection.
MODEL:
  BACKBONE:
    # Backbone identifier string. NOTE(review): "ViT-B/16" presumably names
    # a CLIP vision-transformer variant — confirm against the model loader.
    NAME: "ViT-B/16"

# Trainer-specific hyperparameters, grouped under the CMPT key.
TRAINER:
  CMPT:
    # Initial context text for the prompt.
    CTX_INIT: "a photo of a"
    PROMPT_DEPTH: 12
    # NOTE(review): the meanings of N_DACTX and N_DSTKN cannot be determined
    # from this file — presumably counts of learnable context / token
    # vectors; confirm against the trainer implementation.
    N_DACTX: 2
    N_DSTKN: 2
    # NOTE(review): L and W are opaque single-letter hyperparameters; their
    # semantics are not visible here — document them once confirmed.
    L: 10
    W: 0.001

