---
# Hyperparameter set identified as "small_ffn_ap", selecting the MoEFfnBlock
# model. All keys are top-level scalars.
# NOTE(review): the grouping comments below are inferred from key names only;
# confirm the exact semantics against the code that consumes this file.
name: small_ffn_ap
model: MoEFfnBlock

# FFN / expert settings (presumably mixture-of-experts routing -- confirm).
ffn_k: 2
ffn_num_experts: 6
task_num: 3
ffn_expert_bias: true
ffn_expert_dim_divisor: 2

# Attention settings.
num_heads: 8
qkv_bias: false
# YAML has no `None` literal: a bare `None` is loaded as the string "None",
# which is truthy in Python. `null` is the YAML spelling that loads as None.
qk_scale: null
attn_drop: 0.0
proj_drop: 0.0

# Loss-term weights (presumably; 0 looks like it disables a term -- confirm).
w_MI: 0.0005
w_H: 0
w_finetune_MI: 0

noisy_gating: false
drop_path: 0.0