# Hydra defaults list: the configs named below are composed in order, and
# `_self_` marks where this file's own keys are merged. Because `_self_` is
# last, values defined in this file take precedence over the entries above it.
defaults:
  # NOTE(review): presumably the shared MMLU instruct-evaluation baseline;
  # its contents are not visible from this file.
  - polygraph_eval_mmlu_default_instruct
  # NOTE(review): presumably configures chain-of-thought output processing
  # (e.g. extracting the final "Guess:" line) - confirm in that config.
  - cot_processing
  - _self_

# Identifier for this experiment variant.
experiment_name: mmlu_verb_2s_cot

# Instruction text. `{subject}` is a format placeholder; the block asks for a
# step-by-step explanation followed by a terse guess on its own line.
# Literal block scalar with strip chomping (`|-`): newlines are kept verbatim
# and the value has no trailing newline.
description: |-
  Provide your best guess for the following question about {subject} selecting one of the options. Before giving your answer, provide a step-by-step explanation of your thought process. Then on a new line give the guess with no other words or explanation.

  For example:

  Explanation: <one sentence step-by-step explanation of your thought process>
  Guess: <most likely guess, as short as possible; not a complete sentence, just the guess!>

# Template for one few-shot example. The explanation line is a fixed
# placeholder string; only `{question}`, `{choices[i]}` and `{answer}` are
# format fields. No trailing newline (`|-`).
few_shot_prompt: |-
  Q:{question}
  A. {choices[0]}
  B. {choices[1]}
  C. {choices[2]}
  D. {choices[3]}
  Explanation: <step-by-step explanation of your thought process>
  Guess:{answer}

# Template for the question actually being asked. Clip chomping (`|`) keeps
# exactly one trailing newline after the last option.
prompt: |
  Q:{question}
  A. {choices[0]}
  B. {choices[1]}
  C. {choices[2]}
  D. {choices[3]}

# NOTE(review): presumably the generation budget for explanation + guess;
# confirm how the consuming code applies it.
max_new_tokens: 200

# Extra estimators for this experiment, each given as a module path, a class
# name and keyword arguments.
# NOTE(review): kwargs are presumably forwarded to the class constructor;
# verify against the code that loads this list.
additional_estimators:
  - module: lm_polygraph.estimators.verbalized_2s
    class_name: Verbalized2S
    kwargs:
      # Follow-up prompt asking for a probability that the guess is correct.
      # Literal block scalar, no trailing newline (`|-`).
      confidence_prompt: |-
        Provide the probability that your guess is correct. Give ONLY the probability, no other words or explanation.

        For example:

        Probability: <the probability between 0.0 and 1.0 that your guess is correct, without any extra commentary whatsoever; just the probability!>
      # One capture group holding the numeric value. The pattern requires
      # digits on both sides of a decimal point, so replies such as
      # "Probability: 1" or "Probability: .5" do not match.
      # NOTE(review): decide whether integer replies should be accepted.
      confidence_regex: 'Probability: (\d+\.\d+)'
      max_new_tokens: 10
      name_postfix: '_cot'
