{
    "n_skills": 8,
    "n_splits": 1,
    "model_modifier": "poly_lora",
    "lora_rank": 16,
    "lora_modules": ".*SelfAttention|.*EncDecAttention|.*DenseReluDense",
    "lora_layers": "q|k|v|o",
    "poly_granularity": "finegrained",
    "trainable_param_names": ".*lora_[ab].*|.*module_logits.*",
    "module_logits_learning_rate": 0.1,
    "adapters_learning_rate": 1e-3,
    "adafactor_scale_parameter": false
}
