# Text model specification: `class` and `factory` name the constructor entry
# point; `args` and `kwargs` list the values supplied alongside it.
# NOTE(review): presumably the consumer calls class.factory(*args, **kwargs);
# confirm against the code that loads this file.
text_model:
  class: uwul.model.AutoModelForCausalLMFactory
  factory: from_config
  args:
  # Architecture definition file. The path is relative; the base directory it
  # is resolved against is not visible here.
  - ./config/arch/NanoLLaMA-200m.json
  kwargs: # config overrides
    # NOTE(review): presumably has to agree with the vocabulary size of the
    # tokenizer configured in this file; verify.
    vocab_size: 32013
    torch_dtype: float16
    # NOTE(review): presumably requires the flash-attn package and supporting
    # hardware at runtime; confirm for the target environment.
    attn_implementation: flash_attention_2
# Tokenizer specification, using the same class/factory/args layout as
# `text_model`; no `kwargs` are given for it.
# NOTE(review): presumably the consumer calls class.factory(*args); confirm
# against the code that loads this file.
tokenizer:
  class: transformers.LlamaTokenizer
  factory: from_pretrained
  args:
  # NOTE(review): looks like a Hugging Face Hub repository id rather than a
  # local path; confirm it is reachable or cached where this config runs.
  - TIPO-Anonymous/TIPO-500M-ft
