---
# Experiment configuration (flat mapping of hyperparameters and switches).
# The meaning of each key is defined by the code that loads this file, which
# is not visible here; notes marked "presumably" / "TODO confirm" are
# assumptions to be verified against that code.

# Model backbone identifier and input resolution
# (presumably image side length in pixels -- TODO confirm).
backbone: "CLIP-ViT-B/16"
resolution: 224

# Output location (null = not set in this file) and print/log frequency
# (unit -- iterations vs. epochs -- is not shown here; TODO confirm).
output_dir: null
print_freq: 10

# Runtime / optimizer switches.
seed: 0
deterministic: true
gpu: 0
num_workers: 8
prec: "fp16"
adam: true
scheduler: "cosine"
eval_on_val: true

# Optimization hyperparameters.
# Floats in exponent form are written with an explicit decimal point:
# YAML 1.1 loaders (e.g. PyYAML) resolve a bare `3e-5` as a *string*,
# whereas `3.0e-5` is a float under both YAML 1.1 and 1.2.
num_epochs: 10
lr: 3.0e-5
wd: 1.0e-1
momentum: 0.9
classifier: "CosineClassifier"

# Head tuning and masking options.
# NOTE(review): semantics of the mask_* values (ratio, EMA coefficient,
# refresh interval) are defined by the consumer -- confirm units there.
head_tuning: true
mask: true
dy_mask: true
mask_momentum: true
mask_ratio: 0.1
mask_ema: 0.3
mask_refresh: 50

# Head initialization source and projection switch
# (presumably consumed by the classifier-head setup -- TODO confirm).
init_head: "text_feat"
use_proj: true