# Model configuration fragment: inherits from `base_model` and sets the
# decoder block class name and attention implementation for a Mistral-style
# model.
# NOTE(review): the `defaults` list looks like Hydra-style config composition;
# confirm against the loader that consumes this file.
defaults:
  # `base_model` is defined elsewhere (not visible in this file); presumably
  # the keys below extend or override its values — verify composition order.
  - base_model

# Intentionally unset here. Presumably the model identifier or checkpoint path
# must be supplied by an override or a derived config — TODO confirm.
name_or_path: null
# Class name of the decoder layer. Presumably used by the consumer to locate
# the model's repeated transformer blocks — verify against the caller.
block_name: MistralDecoderLayer
# Attention backend selector. Presumably forwarded to the model loader, and
# `flash_attention_2` likely requires a compatible runtime — confirm.
attn_implementation: flash_attention_2