# Hydra settings: the run directory is built from the `cache_path` key
# defined in this file, with a fixed `test/` suffix.
hydra:
  run:
    dir: "${cache_path}/test/"

# Hydra defaults list; the order of entries is significant.
# `_self_` is listed after the `model` group entry, so (per Hydra's
# documented composition order) the keys in this file are merged after the
# selected model config.
defaults:
  - model: bloomz-560m
  - _self_

# Base directory; interpolated into `hydra.run.dir`.
cache_path: "./workdir/output"
# Resolved through the `hydra:` resolver to the run directory.
save_path: "${hydra:run.dir}"

# Task identifier.
# NOTE(review): the set of accepted values is defined by the consumer of
# this config and is not visible here.
task: "qa"

# Dataset location and how it is read.
dataset: "SpeedOfMagic/trivia_qa_tiny"
load_from_disk: false

# Split names and the columns used as input text and reference label.
train_split: "train"
eval_split: "test"
text_column: "question"
label_column: "answer"

# Empty string (not null).
prompt: ''

# Text-generation settings.
# NOTE(review): how the consumer applies `temperature` (e.g. whether
# sampling is enabled) is not visible in this file - confirm.
generation_params:
  # One entry: a newline character. Double quotes are required so that
  # `\n` is parsed as an escape sequence rather than two literal characters.
  generate_until: ["\n"]
  temperature: 0.7

ignore_exceptions: false

# All four `use_*_ue` switches are disabled in this config.
use_seq_ue: false
use_tok_ue: false
use_density_based_ue: false
use_ens_ue: false

# Metrics identified by `name`; `args` is supplied only where listed
# (presumably constructor arguments - confirm against the consumer).
generation_metrics:
  - name: RougeMetric
    args:
      - "rouge1"
  - name: BartScoreSeqMetric
    args:
      - "rh"
  - name: AccuracyMetric

# Extra estimators, each described by a dotted module path (`module`), a
# class name within it (`class_name`), and keyword arguments (`kwargs`,
# an explicit empty mapping here rather than null).
additional_estimators:
  - module: lm_polygraph.estimators.perplexity
    class_name: Perplexity
    kwargs: {}

# Run-size settings.
batch_size: 2
subsample_eval_dataset: 10
max_new_tokens: 256

# Explicitly null in this config.
# NOTE(review): the fallback behaviour for null is decided by the consumer.
device: null
seed: null
