# ---- Run / experiment settings ----
number_of_edits: 50
edit_set: 1
alg_name: 'MEMIT'

# `model_name` and `model` currently carry the same value.
# Alternative values kept for reference (presumably Hugging Face model IDs):
#   llama:  meta-llama/Llama-2-7b-chat-hf
#   pythia: EleutherAI/pythia-14m
model_name: 'EleutherAI/pythia-14m'
model: 'EleutherAI/pythia-14m'

edit_dataset: 'counterfact'
stats_dir: '/scratch/sux7mp/stats'
device: 0
tag: 'default'
# Plain string value, not a boolean.
wandb: 'disabled'

# ---- Editing hyperparameters (used with `alg_name`) ----
layers: [2, 3]
clamp_norm_factor: 0.75
layer_selection: "all"
fact_token: "subject_last"
v_num_grad_steps: 25
# Written with a decimal point instead of `5e-1`: YAML 1.1 resolvers (e.g.
# PyYAML) only treat exponent notation as a float when the mantissa contains
# a ".", so `5e-1` would be loaded as the string "5e-1".
v_lr: 0.5
v_loss_layer: 5
v_weight_decay: 0.5
kl_factor: 0.0625
mom2_adjustment: true
mom2_update_weight: 15000

# Module path templates. `{}` is a placeholder, presumably filled in with a
# layer index by the consumer -- confirm against the loading code.
rewrite_module_tmp: "gpt_neox.layers.{}.mlp.dense_4h_to_h"
layer_module_tmp: "gpt_neox.layers.{}"
mlp_module_tmp: "gpt_neox.layers.{}.mlp"
attn_module_tmp: "gpt_neox.layers.{}.attention"
ln_f_module: "gpt_neox.final_layer_norm"
lm_head_module: "embed_out"

mom2_dataset: "wikipedia"
mom2_n_samples: 100000
mom2_dtype: "float32"

max_length: 40
batch_size: 50
model_parallel: false


# # FT
# lr: 5e-7
# weight_decay: 0
# norm_constraint: false
# num_steps: 25

# ---- Compression ----
seed: 0
nsamples: 128

sparsity_ratio: 0.3
sparsity_type: 'unstructured'
# Options: wanda or sparsegpt
prune_method: 'sparsegpt'
quant_method: 'gptq'

# `compression_dataset` and `dataset` currently carry the same value.
compression_dataset: 'c4'
dataset: 'c4'

percdamp: 0.01
wbits: 8
groupsize: -1
sym: true
nearest: false
new_eval: false
act_order: false
true_sequential: false
static_groups: false

cache_dir: '/scratch/sux7mp/llm_weights'
use_variant: false
save: 'out/'
save_model: null
eval_zero_shot: false

# ---- Intervention selection ----
interventions: ["edit", "prune"]
# Booleans are written in canonical lowercase, matching the rest of the file.
compress_first: false
edit: false
compress: false
# Options: prune or quant
method: prune

# ---- Checkpoint loading / saving ----
# Booleans are written in canonical lowercase, matching the rest of the file.
load_ckpt: false
ckpt_path: '/scratch/sux7mp/saved_models/checkpoint_20231221_113020.pth'

save_ckpt: false

edit_train: false
