# hparams/MORE/blip2.yaml

# ================= Model =================
# Model identity and tokenizer settings for the BLIP-2 / OPT-2.7B setup.
# NOTE(review): presumably a GPU index rather than a device string -- confirm
# against the loader.
device: 0
# `name` and `tokenizer_name` reference the same local path; keep them in sync.
name: /models/opt-2.7b
model_name: blip2
model_class: Blip2OPT
tokenizer_class: GPT2Tokenizer
tokenizer_name: /models/opt-2.7b
# Explicit empty list (not null).
inner_params: []
opt_precision: bf16

# ================= Method (M-ORE) =================
# Hyperparameters for the method selected by `alg: MORE`.
alg: MORE
rank: 512
lora_alpha: 1024
lora_dropout: 0.0
top_k: 7
eta: 0.1
rls_lambda: 2000
n_last_layers: 12
more_update_mode: online
more_use_masked_z: True
more_restore_p: False
# NOTE(review): `none` parses as the string "none", not YAML null (unlike the
# `null` values below) -- confirm the consumer compares against the string.
more_score_norm: none
# NOTE(review): null here; presumably falls back to `eta` / `rls_lambda`
# above -- TODO confirm.
more_eta_vision: null
more_rls_lambda_vision: null
more_nonlinear: none
more_layer_norm: False
# Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
# resolve a bare `1e-5` as a string, whereas `1.0e-5` is a float under both
# YAML 1.1 and 1.2.
more_layer_norm_eps: 1.0e-5

# ================= Weights for Metrics =================
# Metric weights (`cedit`, `iedit`, `cloc`) followed by general optimisation
# settings.
cedit: 0.1
iedit: 0.1
cloc: 1.0
dropout: 0.0
train_base: False
no_grad_layers: null
archive: null
# Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
# resolve a bare `1e-6` as a string, whereas `1.0e-6` is a float under both
# YAML 1.1 and 1.2.
lr: 1.0e-6
seed: 42

# ================= Train / Eval =================
# Loop, logging, validation and early-stopping settings.
batch_size: 1
model_save_pt: 200
silent: False
max_iters: 1000
log_interval: 1
eval_log_interval: 1000
final_eval: True
val_interval: 200
early_stop_patience: 1000
early_stop_key: "loss/total_edit_val"
# NOTE(review): with eval_only enabled, the training-related keys in this
# section are presumably not exercised -- confirm against the trainer.
eval_only: True
half: False
save: False
verbose: True
debug: False

val_batch_size: 1
accumulate_bs: 2
val_steps: 100
opt: Adam # not used
# Trailing-dot float literal, i.e. 100.0.
grad_clip: 100.

# ================= Output =================
# Absolute path. NOTE(review): presumably must be writable by the run --
# confirm whether the consumer creates it when missing.
results_dir: /results/MORE_Eval_BLIP2_OPT

# ================= Multimodal =================
exact_match: False
# The two `hugging_cache/...` checkpoint paths are relative, unlike the
# absolute paths used elsewhere in this file.
# NOTE(review): presumably resolved against the process working directory --
# confirm.
qformer_checkpoint: hugging_cache/blip2_pretrained_opt2.7b.pth
qformer_name_or_path: bert-base-uncased
state_dict_file: hugging_cache/eva_vit_g.pth
pretrained_ckpt: null

# ================= Image =================
# Both image keys point at the same absolute directory.
coco_image: /root/data
rephrase_image: /root/data
