# Config composition list. `base` is listed before `_self_`; under Hydra-style
# defaults-list semantics that means the keys in this file override `base`.
# NOTE(review): `base` is not visible from this file — confirm it resolves.
defaults:
  - base
  - _self_

# Short label for this model; presumably used to name logs/output artifacts
# (verify against the consumer of this key).
model_log_name: qwen3_8b
# Model identifier to load; looks like a Hugging Face Hub repo id
# (NOTE(review): the key name suggests a local path is also accepted — confirm).
model_name_or_path: Qwen/Qwen3-8B

# Model loading options.
# NOTE(review): presumably forwarded to the model loader (e.g. a
# `from_pretrained`-style call) — confirm against the code that reads this.
model_args:
  # Revision (branch, tag, or commit) of the model to use; also referenced by
  # `tokenizer.model_revision` in this file.
  model_revision: main
  # Weight/compute precision, given as a dtype name string.
  torch_dtype: bfloat16
  # Attention backend selector.
  # NOTE(review): `flash_attention_2` typically needs the flash-attn package
  # and a supported GPU — verify the target environment provides both.
  attn_implementation: flash_attention_2

# Tokenizer settings. The revision is an interpolation that points at
# `model_args.model_revision`, so the tokenizer follows the model's revision
# rather than being pinned separately.
tokenizer:
  model_revision: '${model_args.model_revision}'