# Model-loading and adapter settings.

# Base checkpoint identifier.
# NOTE(review): looks like a Hugging Face Hub repo id -- confirm with the loader.
model_name_or_path: microsoft/Phi-3-mini-4k-instruct

# Adapter (PEFT / LoRA) options.
# Canonical lowercase boolean; parses to the same value as `True`.
use_peft: true
# NOTE(review): alpha (64) is half of r (128) -- confirm this ratio is intended.
lora_alpha: 64
lora_r: 128
lora_target_modules: "all-linear"

# Attention backend and parameter dtype, passed as plain strings.
# NOTE(review): presumably flash_attention_2 needs the flash-attn package
# and a half-precision dtype such as the bfloat16 below -- verify.
attn_implementation: "flash_attention_2"
torch_dtype: bfloat16

# Explicit null here; a commented-out mapping form of this key
# (path / mode / in_scale / out_scale) follows below.
init_embed: null
# init_embed:
#   path: null
#   mode: mean
#   in_scale: 1
#   out_scale: null