# Hydra runtime settings.
hydra:
  run:
    # Per-run output directory, built from cache_path, the literal "mmlu",
    # the model and dataset config values, and the current date and time.
    # NOTE(review): `dataset` is a list in this file and `model` is selected
    # through the defaults list, so neither may resolve to a plain string —
    # confirm the resulting directory name is what is intended.
    dir: ${cache_path}/mmlu/${model}/${dataset}/${now:%Y-%m-%d}/${now:%H-%M-%S}

# Hydra defaults list: compose the `bloomz-560m` option of the `model` config
# group first. `_self_` is listed last so that the values in this file take
# precedence over the composed defaults.
defaults:
  - model: bloomz-560m
  - _self_

# Root directory under which hydra.run.dir is created.
cache_path: ./workdir/output
# Resolves to the Hydra run directory (hydra.run.dir).
save_path: '${hydra:run.dir}'

# Task identifier.
# NOTE(review): the accepted values are defined by the consuming code, not here.
task: qa

# NOTE(review): presumably `base_manager` points at previously saved results to
# start from, and the flag below controls whether they are recomputed — confirm.
base_manager: null
overwrite_base_estimations: false

# Dataset specification, given as a two-element list.
# NOTE(review): presumably [dataset name, configuration name] — confirm
# against the code that loads it.
dataset:
  - cais/mmlu
  - all
# Column names; they match the {question} and {answer} placeholders used in
# `prompt` below.
text_column: question
label_column: answer
# Header text with a {subject} placeholder.
# NOTE(review): presumably filled in per MMLU subject by the consumer — confirm.
description: "The following are multiple choice questions (with answers) about {subject}."
# Template for a single question: the question text, four lettered choices
# (A-D) taken from `choices[0..3]`, and the answer.
prompt: "Q:{question}\nA. {choices[0]}\nB. {choices[1]}\nC. {choices[2]}\nD. {choices[3]}\nAnswer:{answer}"
# Dataset split names.
# NOTE(review): presumably few-shot examples come from `few_shot_split` and
# evaluation runs on `eval_split` — confirm.
few_shot_split: dev
train_split: validation
eval_split: test
max_new_tokens: 3
load_from_disk: false
# NOTE(review): presumably the number of few-shot examples per prompt — confirm.
n_shot: 5
# NOTE(review): presumably a cap on the number of examples per subject — confirm.
max_subject_size: 100
# Extra generation parameters.
# NOTE(review): `generate_until` presumably lists stop strings, so generation
# would end at the first newline — confirm against the consumer.
generation_params:
  generate_until:
    - "\n"

# Names of the statistics to save. The names are interpreted by the consuming
# code; the group comments below only describe the naming pattern of each
# group.
save_stats:
  # Input tokens and greedy_* statistics.
  - input_tokens
  - greedy_log_probs
  - greedy_tokens
  - greedy_tokens_alternatives
  - greedy_texts
  - greedy_log_likelihoods

  # *_all_layers_embeddings statistics.
  - mean_all_layers_embeddings
  - last_all_layers_embeddings

  # sample_* statistics.
  - sample_tokens
  - sample_tokens_alternatives
  - sample_texts
  - sample_log_probs
  - sample_log_likelihoods

  # Selected-sample texts and their ids (first / best / best_normalized / mbr).
  - first_sample_texts
  - first_sample_text_ids
  - best_sample_texts
  - best_sample_text_ids
  - best_normalized_sample_texts
  - best_normalized_sample_text_ids
  - mbr_sample_texts
  - mbr_sample_text_ids

  # Semantic-matrix and similarity statistics.
  - semantic_classes_entail
  - semantic_matrix_entail
  - semantic_matrix_contra
  - semantic_matrix_classes
  - sample_sentence_similarity
  - sample_token_similarity
  - token_similarity
  - align_semantic_matrix
  - rouge_semantic_matrix

  # greedy_* semantic-matrix and similarity statistics.
  - greedy_semantic_matrix_forward
  - greedy_semantic_matrix_backward
  - greedy_semantic_matrix
  - greedy_sentence_similarity_forward
  - greedy_sentence_similarity_backward
  - greedy_sentence_similarity
  - greedy_rouge_semantic_matrix
  - greedy_align_semantic_matrix_forward
  - greedy_align_semantic_matrix_backward
  - greedy_align_semantic_matrix

  # Entropy statistics.
  - entropy
  - sample_entropy

# NOTE(review): presumably the number of top-probability tokens used when
# computing the entropy statistics — confirm.
entropy_top_k: 50

# No separate training dataset is configured.
# NOTE(review): how `train_test_split` and `test_split_size` are used is
# defined by the consuming code — confirm before changing them.
train_dataset: null
train_test_split: false
test_split_size: 1

# Background training dataset: one file of allenai/c4, with `text` as the text
# column and `url` as the label column.
# NOTE(review): which estimators use the background dataset is not visible
# here — confirm.
background_train_dataset: allenai/c4
background_train_dataset_text_column: text
background_train_dataset_label_column: url
background_train_dataset_data_files: en/c4-train.00000-of-01024.json.gz
background_load_from_disk: false

# Subsample sizes for each dataset.
# NOTE(review): -1 presumably means "use the full dataset" — confirm.
subsample_background_train_dataset: 1000
subsample_train_dataset: 1000
subsample_eval_dataset: -1

# Toggles for the uncertainty-estimator families; all are disabled here.
# NOTE(review): the meaning of each family (density-based / seq / tok / ens)
# is defined by the consuming code.
use_density_based_ue: false
use_seq_ue: false
use_tok_ue: false
use_ens_ue: false
# No generation metrics are configured.
generation_metrics: null

# No additional estimators are configured (explicit empty list).
additional_estimators: []

# NOTE(review): presumably, when false, an exception aborts the run instead of
# being skipped — confirm.
ignore_exceptions: false

# Batch sizes.
# NOTE(review): `deberta_batch_size` presumably applies to a DeBERTa-based
# model used by some statistics — confirm.
batch_size: 1
deberta_batch_size: 1

# Seeds, given as a list; a single seed (1) is configured.
seed:
  - 1
