# Dataset settings. The values are consumed by code outside this file.
data:
    # NOTE(review): presumably the maximum sequence length per sample — confirm.
    truncation_length: 512
    # NOTE(review): presumably the number of samples to use — confirm.
    size: 200000
    batch_size: 10
    # NOTE(review): meaning is not evident from this file — confirm with the consumer.
    val_scale: 10


# Model-pair settings: a name and a layer index for model A and model B,
# followed by option flags and the selected method.
# NOTE(review): flag semantics are not visible in this file — confirm
# against the code that reads this section.
model:
    model_a_name: 'gpt2-small'
    model_b_name: 'gpt2-medium'
    layer_a: 6
    layer_b: 10
    force_ortho: false
    norm_adjustment: false
    run_inverse: true
    use_bias1: true
    use_bias2: true
    method: 'separate_mat'

# NOTE(review): this name mentions pythia-70m, while the model section of
# this file lists gpt2 models — confirm the pairing is intended.
sae:
    name: 'pythia-70m-deduped-res-sm'

# Top-level optimisation settings.
# NOTE(review): alpha_inv is presumably a weighting coefficient — confirm.
alpha_inv: 1.0
epochs: 2
lr: 0.0001
weight_decay: 0
use_scheduler: true
# NOTE(review): presumably the interval between validation runs; the unit
# (steps vs. samples) is not visible here — confirm.
val_every: 2500

# Runtime, logging and device switches.
run_sae_eval: false
use_wandb: true
verbose: true
device: 'cuda'
count_flops: true
