# GPT2 small model configuration.
#
# NOTE(review): the code that reads these keys is not part of this file, so
# the per-key notes below are inferred from the key names and must be
# confirmed against the loader.
#
# Model identifier or path; presumably passed to the model loader.
name_or_path: gpt2
# null here; presumably the tokenizer then falls back to name_or_path
# (TODO confirm).
tokenizer_name_or_path: null
# null here; presumably means no previously saved weights are loaded on top
# of the base model (TODO confirm).
archive: null
# Name of the model's transformer block class; presumably used to decide how
# the model is wrapped for sharded training (TODO confirm).
block_name: GPT2Block
policy_dtype: float32  # float32 for better numerical stability
# null here; presumably leaves mixed precision for the policy disabled
# (TODO confirm).
fsdp_policy_mp: null
reference_dtype: float32  # float32 for better numerical stability