# Model arguments
#
# Flat key/value settings describing a model of the 'llama' architecture.
# Notes on what individual keys mean are inferred from their names only;
# confirm against the code that consumes this file.
architecture: 'llama'

# Spelled with an explicit mantissa dot and a signed exponent so that both
# YAML 1.1 and YAML 1.2 loaders resolve it to the float 100000.0 on their
# own; a bare `1e5` is not resolved as a float by every parser.
rope_theta: 1.0e+5
# NOTE(review): 1.0 presumably applies the rotary embedding to the full
# per-head dimension -- confirm.
partial_rotary_factor: 1.0

hidden_size: 384
# Equals 4 x hidden_size.
intermediate_size: 1536
# hidden_size / num_attention_heads = 64.
num_attention_heads: 6
num_layers: 6

max_position_embeddings: 1024
# NOTE(review): 0.0 presumably turns dropout off -- confirm.
dropout: 0.0
