_target_: fusion_bench.method.moe_pruner.MoEPruner

nsamples: 100
seed: 42
device: cuda
max_seqlen: 2048
# `prune_type` can be either `unstructured` or `semistructured`
prune_type: unstructured
# === options for unstructured pruning ===
# `sparsity_ratio` is the ratio of weights to be pruned, 1 means all weights are pruned
sparsity_ratio: 0.5
# === options for semistructured pruning ===
# 2:4 means 2 out of 4 weights are pruned
n: 2
m: 4
