strategy: head_only
num_epochs: 5
batch_size: 16
learning_rate: 2e-4
max_seq_length: 256
freeze_base: true 