# hparams/MORE/minigpt4.yaml

# ================= Model =================
# NOTE(review): presumably the accelerator (GPU) index — confirm with the loader.
device: 0
# Filesystem location of the language model; the tokenizer below points at
# the same directory.
name: '/models/Xorbits/vicuna-7b-v1.5'
model_name: 'minigpt4'
model_class: 'Blip2OPT'
tokenizer_class: 'LlamaTokenizer'
tokenizer_name: '/models/Xorbits/vicuna-7b-v1.5'
# Explicitly an empty list (not null).
inner_params: []

# ================= Method (M-ORE) =================
alg: MORE
rank: 512
lora_alpha: 1024  # equals 2 x rank
lora_dropout: 0.0
top_k: 7
eta: 0.1
rls_lambda: 2000
n_last_layers: 12
more_update_mode: online
more_use_masked_z: true
more_restore_p: false
# Quoted on purpose: this is the literal string "none", not a YAML null.
more_score_norm: 'none'
# Left unset (null).
# NOTE(review): presumably these fall back to `eta` / `rls_lambda` — confirm.
more_eta_vision: null
more_rls_lambda_vision: null
# Quoted on purpose: the literal string "none", not a YAML null.
more_nonlinear: 'none'
more_layer_norm: false
# Keep the decimal point: YAML 1.1 loaders (e.g. PyYAML) resolve a bare
# `1e-5` to the string "1e-5" instead of a float.
more_layer_norm_eps: 1.0e-5

# ================= Loss Weights / Optimization =================
cedit: 0.1  # weight for text edit loss
iedit: 0.1  # weight for image edit loss
cloc: 1.0  # weight for locality losses (text + image)
dropout: 0.0
train_base: false
no_grad_layers: null
archive: null
# Keep the decimal point: YAML 1.1 loaders (e.g. PyYAML) resolve a bare
# `1e-6` to the string "1e-6" instead of a float.
lr: 1.0e-6
seed: 42

# ================= Train / Eval =================
batch_size: 1
model_save_pt: 200
silent: false
max_iters: 1000
log_interval: 1
eval_log_interval: 1000
final_eval: true
val_interval: 200
early_stop_patience: 1000
# Metric name; quoted because it contains a slash-separated path-like key.
early_stop_key: 'loss/total_edit_val'
# NOTE(review): with eval_only enabled the training knobs in this section are
# presumably unused — confirm against the trainer.
eval_only: true
half: false
debug: false
save: false
verbose: true

val_batch_size: 1
accumulate_bs: 2
val_steps: 100
opt: Adam
grad_clip: 100.0

# ================= Output =================
# Absolute path; machine-specific, adjust per environment.
results_dir: '/root/results/MORE_Eval'

# ================= Multimodal =================
exact_match: false
# Q-Former weights
qformer_checkpoint: '/models/blip2_pretrained_flant5xxl.pth'
# Q-Former config/tokenizer name
qformer_name_or_path: 'bert-base-uncased'
# EVA ViT weights
state_dict_file: '/models/eva_vit_g.pth'
# MiniGPT4 checkpoint
# NOTE(review): the "prerained" spelling appears to match the upstream
# checkpoint filename — confirm against the file on disk before renaming.
pretrained_ckpt: '/models/prerained_minigpt4_7b.pth'

# ================= Image =================
# Image root for CaptionDataset.
coco_image: '/root/data'
# Rephrase-image root for CaptionDataset (same directory as coco_image).
rephrase_image: '/root/data'
