# Top-level run settings for this Hydra-loaded config (see the `hydra:` section).
# Booleans use canonical lowercase and floats carry an explicit decimal point so
# that YAML 1.1 loaders (e.g. plain PyYAML, which reads `2e-5` as a string)
# infer the same types as OmegaConf does.
alg: enn
lr: 2.0e-5
edit_lr: 1.0e-2
seed: 42
debug: false
model_save_pt: 5000
edit_bs: 1
silent: false
# max_iters: 10000  # for counterfact
max_iters: 10000
log_interval: 100
val_interval: 1000  # for counterfact
# val_interval: 5000
lr_lr: 1.0e-3
batch_size: 1
val_batch_size: 1
accumulate_bs: 10
# NOTE(review): cedit / cloc / cbase look like loss-term weights — confirm
# against the training code.
cedit: 0.1
cloc: 1.0
cbase: 1.0
val_steps: 500
# NOTE(review): the device index is hard-coded here and again in `device_map`;
# presumably the two must agree and match the host's hardware — confirm.
device: 5
# cls_device: 3
# rep_device: 0
device_map: [5]
base_loss: distill
oracle: false
train: true
train_base: true
opt: Adam
single_batch: false
archive: null
grad_clip: 100.0
ref: null
# NOTE(review): patience (40000) is larger than `max_iters` (10000), so early
# stopping presumably never triggers — confirm this is intended.
early_stop_patience: 40000
early_stop_key: "loss/total_edit_val"
dropout: 0.0
tokenizer: null
model_name: gptneo
dataset_name: counterfact
# Interpolated from `dataset_name` and `model_name` above.
results_dir: ./results/port/${dataset_name}/${model_name}
# results_dir: ./results/counterfact/gptj  # for counterfact
no_grad_layers: null
eval_only: false
half: false
save: false
log_errors: false
unlikelihood: true
generate: false
generate_file: ./models/generate.json
original_generate_file: ./a.json

# Model checkpoint settings.
# NOTE(review): the checkpoint file name (GPT-1.5B.serac) does not obviously
# match the top-level `model_name: gptneo` / `alg: enn` — confirm this path is
# the intended one.
model:
  pt: ./models/GPT-1.5B.serac

# Dataset settings. Paths are anchored at `${hydra:runtime.cwd}` rather than
# being written relative to the run directory.
# The `{}` inside several paths is presumably a placeholder filled in by the
# data-loading code (e.g. with a split name) — TODO confirm.
# NOTE(review): the top-level `dataset_name` is `counterfact`, but the active
# `zsre_path` points at the zsre file and the counterfact path is commented
# out — confirm which one is intended.
data:
  path: null
  rephrase: true
  zsre_nq: true
  zsre_impl: false
  zsre_impl_path: ${hydra:runtime.cwd}/data/zsre/impl_{}.json
  zsre_yn: false
  zsre_yn_path: ${hydra:runtime.cwd}/data/zsre/zsre_yn_{}.txt
  zsre_eval_idxs: null
  zsre_path: ${hydra:runtime.cwd}/data/zsre/structured_zeroshot-{}-new_annotated_final.jsonl
  # zsre_path: ${hydra:runtime.cwd}/data/counterfact/counterfact-{}.jsonl  # for counterfact
  nq_path: ${hydra:runtime.cwd}/data/nq
  wiki_webtext: true
  n_edits: 1
  # Hard-negative options; the numeric values below sit alongside
  # `hard_neg: false`, so they are presumably unused in this setup — confirm.
  hard_neg: false
  hard_neg_neighbors: 100
  hard_neg_exclude: 25
  hard_neg_temp: 0.1
  hard_neg_prob: 0.5
  flip_inner_outer: false
  sent_eval_sample: false
  n_outer_max: null

# Evaluation settings. `log_interval` here is nested under `eval` and is a
# separate key from the top-level `log_interval`.
# Booleans are lowercase to match the `data:` section.
eval:
  verbose: true
  log_interval: 100
  final_eval: true

# Hydra output-directory settings (semantics per Hydra's working-directory
# documentation).
hydra:
  run:
    # Single runs use the current directory as their run directory.
    dir: ./
  sweep:
    # Sweep output directory, named with a timestamp pattern passed to the
    # `now` resolver (`%f` is the microsecond field in strftime notation).
    dir: ./outputs/${now:%Y-%m-%d_%H-%M-%S_%f}
    # One subdirectory per job, named by the job number.
    subdir: ${hydra.job.num}
