# Composition list: `base` is listed before `_self_`.
# NOTE(review): this looks like a Hydra defaults list, in which case the
# values in this file are merged after (and override) `base` - confirm.
defaults:
  - base
  - _self_

# Top-level mode switch; this file sets it to `eval`.
mode: eval

# Evaluation settings.
eval:
  batch_size: 16
  # Number of sampling rounds performed per iteration. ASR@k is evaluated
  # with k = num_trials * len(max_new_tokens_list); with the values in
  # this file that is k = 5 * 2 = 10.
  num_trials: 5
  prompter:
    # Each entry multiplies k (see num_trials above).
    # NOTE(review): presumably each value is a generation-length cap
    # (max new tokens) for the prompter - confirm against the consumer.
    max_new_tokens_list:
      - 30
      - 50
  data:
    # `${output_dir}` is an interpolation; `output_dir` is not defined in
    # this file (presumably it comes from `base` or an override - confirm).
    suffix_dataset_dir: "${output_dir}/suffix_dataset"
    # Maps a split name to its CSV path. The paths are relative; what they
    # are resolved against depends on the consumer. The validation split is
    # currently disabled (commented out).
    dataset_pth_dct:
      train: "data/harmful_behaviors/dataset/full_train.csv"
      # validation: "data/harmful_behaviors/dataset/full_validation.csv"
      test: "data/harmful_behaviors/dataset/full_test.csv"