# Model loading options.
# NOTE(review): the key names match Hugging Face `from_pretrained` keyword
# arguments; presumably they are forwarded there — confirm against the loader.
model_args:
  pretrained_model_name_or_path: 'allenai/OLMo-2-0425-1B'
  # Pins a specific revision of the repository above; the same revision
  # string is used under tokenizer_args.
  revision: 'stage1-step100000-tokens210B'
  attn_implementation: 'flash_attention_2'
  torch_dtype: 'bfloat16'
  # Optional settings, currently disabled:
  # load_in_8bit: true
  # device_map: 'auto'
# Tokenizer loading options. Repository name and revision are identical to
# the values given under model_args; keep the two in sync when changing either.
tokenizer_args:
  pretrained_model_name_or_path: 'allenai/OLMo-2-0425-1B'
  revision: 'stage1-step100000-tokens210B'
# Prompt-formatting options.
template_args:
  # Written as canonical lowercase `false`: capitalised `False` is only a
  # boolean under some YAML schemas, while `false` is a boolean in all of them.
  apply_chat_template: false
  # Start/end markers for user and assistant turns.
  # NOTE(review): with apply_chat_template off, these tags are presumably used
  # to delimit turns manually — confirm against the consuming code.
  # The end tags are double-quoted so that "\n" is parsed as a newline escape.
  user_start_tag: "<|user|>"
  user_end_tag: "\n"
  asst_start_tag: "<|assistant|>"
  asst_end_tag: "\n"