---
# Run configuration: one `experiment` mapping plus a top-level `task` selector.
# NOTE(review): field semantics are defined by the consuming code, which is not
# visible from this file; anything marked "presumably" should be confirmed.
experiment:
  # Data selection: the `test` split of `qa`, with n_edits set to 2000.
  dataset:
    name: 'qa'
    split: 'test'
    n_edits: 2000

  model:
    # Presumably a Hugging Face Hub model id -- verify against the loader.
    name: 'meta-llama/Llama-2-7b-hf'
    # Presumably a relative filesystem path -- TODO confirm the base directory.
    sim: 'checkpoints/qa'

  # Same dataset name and n_edits as `dataset` above, but the `train` split.
  gate:
    name: 'qa'
    split: 'train'
    n_edits: 2000

  editor:
    n_experts: 1
    n_epochs: 25
    # Presumably has to agree with the model's hidden size -- TODO confirm.
    n_embed: 4096
    threshold: 0.6
    seq: true
    # A single string value; quoted because it contains `[` and `]`.
    layer: 'model.layers[0]'
    top_k: 1

task: 'edit'
