# Human-readable metadata for this job configuration.
# NOTE(review): how the consumer uses `name` (e.g. as a job identifier) is
# not visible in this file — confirm against the launcher.
description: 'Jigsaw example'
name: 'model-interventions'
# Values handed to the job. Several entries are lists even when they hold a
# single item — presumably so the consumer can accept or sweep over multiple
# values; TODO confirm against the launcher.
parameters:
  dataset:
    - 'jigsaw'
  # Labels selecting the two contrasting subsets of the dataset.
  positive_subset:
    - 'toxic'
  negative_subset:
    - 'non-toxic'
  num_workers: 4
  pooling_op:
    - 'max'
  seed: 42
  model_path: 'meta-llama/Llama-3.1-8B-Instruct'
  # Module name patterns; the `*` presumably acts as a wildcard over the
  # layer index — verify how the consumer matches these.
  # Kept quoted so the `*` is never mistaken for a YAML alias indicator.
  module_names:
    - 'model.layers.*.mlp.gate_proj'
    - 'model.layers.*.mlp.up_proj'
    - 'model.layers.*.mlp.down_proj'
  tag: 'toxicity-responses'
  intervention: 'aura'
  # Explicit null: no value is set here. How the consumer interprets a
  # missing expert count is not visible in this file.
  num_experts: null
# Command line for this job. `${PYTHON}` is left as a literal placeholder in
# the YAML string; presumably the launcher substitutes the interpreter path —
# TODO confirm.
command: '${PYTHON} -m scripts.learn_aura'