---
# Settings for a configuration named "old" that selects the "MoEBlock" model.
# NOTE(review): the groupings and meanings noted below are inferred from the
# key names only; confirm them against the code that consumes this file.
name: old
model: MoEBlock

# Presumably attention / MLP shape options; verify against the consumer.
num_heads: 8
mlp_ratio: 4.0
qkv_bias: false
# YAML has no `None` literal: a plain None loads as the string "None", which
# is truthy in Python. `null` is the YAML null and loads as Python None.
qk_scale: null

# Presumably dropout-style rates; all are 0.0 here.
drop: 0.0
attn_drop: 0.0
drop_path: 0.0

# Presumably mixture-of-experts sizing (6 total, 2 active) and a task count.
num_total_experts: 6
num_active_experts: 2
task_num: 3
