# Experiment configuration; the top-level `task` key at the bottom is `edit`.
# NOTE(review): the meaning of every key is defined by the consuming code,
# which is not visible from this file. Notes marked "presumably" are
# assumptions to confirm against that code.
experiment:
  # Dataset `qa`, split `test`, n_edits 1000.
  # Presumably the data the edits are applied to / evaluated on - confirm.
  dataset:
    name: qa
    split: test
    n_edits: 1000
  model:
    # Looks like a Hugging Face Hub model id - confirm how the loader
    # resolves it (hub download vs. local cache).
    name: meta-llama/Llama-2-7b-hf
    # Relative path. TODO confirm what `sim` refers to and which directory
    # the path is resolved against.
    sim: checkpoints/qa
  # Same `name` and `n_edits` as `dataset` above, but split `train`.
  # Presumably the data used by a gating component - confirm.
  gate:
    name: qa
    split: train
    n_edits: 1000
  editor:
    # NOTE(review): `top_k` below (4) is smaller than `n_experts` (5);
    # presumably top_k of the n_experts are selected - confirm.
    n_experts: 5
    n_epochs: 25
    # Presumably has to match the hidden size of `model.name` - TODO confirm.
    n_embed: 4096
    # Float cutoff; what is compared against it is not visible here.
    threshold: 0.6
    # Boolean flag; presumably toggles sequential processing - confirm.
    seq: true
    # Plain (unquoted) string. Valid YAML in block context because `[` is
    # not the first character. Presumably an attribute path resolved
    # against the loaded model by the consumer - confirm.
    layer: model.layers[0]
    top_k: 4
task: edit
