# PromptKD with LMC regularization
DATALOADER:
  TRAIN_X:
    BATCH_SIZE: 8
  TEST:
    BATCH_SIZE: 100
  NUM_WORKERS: 8

INPUT:
  SIZE: (224, 224)
  INTERPOLATION: "bicubic"
  PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
  PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
  TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]

OPTIM:
  NAME: "sgd"
  LR: 0.005
  MAX_EPOCH: 20
  LR_SCHEDULER: "cosine"
  WARMUP_EPOCH: 1
  WARMUP_TYPE: "constant"
  WARMUP_CONS_LR: 1e-5

TRAIN:
  PRINT_FREQ: 20

MODEL:
  BACKBONE:
    NAME: "ViT-B/16"

TEST:
  FINAL_MODEL: "best_val"
  NO_TEST: False

TRAINER:
  PROMPTKD:
    N_CTX_VISION: 4
    N_CTX_TEXT: 4
    CTX_INIT: "a photo of a"
    PREC: "fp16"
    PROMPT_DEPTH_VISION: 9
    PROMPT_DEPTH_TEXT: 9
    TEACHER_NAME: "ViT-L/14"
    PROJECT_LAYER: 2
    CE_WEIGHT: 0.0
    KD_WEIGHT: 1000.0
    TEMPERATURE: 1.0
    
    # LMC Regularization Settings
    USE_LMC: True
    LAMBDA_REG: 0.1          # λ coefficient for L2 regularization ||w_student - w_pretrained_student||²
    BETA_LMC: 0.5            # β coefficient for LMC connectivity loss
    NUM_SAMPLES: 10          # Number of interpolation points for LMC connectivity
    PRETRAINED_STUDENT_PATH: null  # Path to pretrained student model (optional)

