# Model / training configuration.
# NOTE(review): the code that consumes this file is not visible here; the
# section headings below are inferred from key names only - confirm them
# against the config loader before relying on them.

# Backbone identifier and input resolution.
# Presumably the image side length in pixels - TODO confirm.
backbone: "CLIP-ViT-B/16"
resolution: 224

# Output location and logging cadence.
# `null` leaves output_dir unset in this file.
output_dir: null
print_freq: 10

# Runtime / optimiser selection flags.
# Booleans are written in canonical lowercase so every YAML 1.1 and 1.2
# loader resolves them to the same value.
seed: 0
deterministic: true
gpu: 0
num_workers: 8
prec: "fp16"
adam: true
scheduler: "cosine"
eval_on_val: true

# Optimisation hyperparameters.
num_epochs: 10
lr: 0.01
# Keep the explicit ".0": YAML 1.1 loaders (e.g. PyYAML) only resolve
# exponent notation as a float when the mantissa contains a dot; a bare
# `5e-4` is loaded as the string "5e-4".
wd: 5.0e-4
momentum: 0.9
classifier: "CosineClassifier"

# Classification-head options.
# NOTE(review): semantics depend on the consumer - verify.
init_head: "text_feat"
head_tuning: true
use_proj: true