# Top-level run settings. Each value is a getenv placeholder; presumably the
# config loader substitutes the named environment variable and falls back to
# the trailing token when the variable is unset — TODO confirm against the
# loader.
# Reads NUM_WORKERS; fallback token is 1.
num_workers: ${!getenv NUM_WORKERS 1}
# Reads PREFIX; no fallback token is given.
# NOTE(review): confirm what the loader does when PREFIX is unset.
prefix_dir: ${!getenv PREFIX}
# Reads REMATCH; fallback token is ".*" (looks like a match-everything
# regex — confirm how the consumer applies it).
rematch: ${!getenv REMATCH .*}
# Settings grouped under corr_config.
corr_config:
  # Getenv placeholder for OVERWRITE with fallback token False.
  # NOTE(review): whether the fallback becomes a boolean or the string
  # "False" depends on the loader — confirm.
  overwrite: ${!getenv OVERWRITE False}
  # Switch-keyed block: the key carries a switch placeholder on -use_judges
  # naming DO_OTHERS and DO_NGRAM; the children are named presets, each
  # supplying use_scores_for_reference_values.
  # NOTE(review): DO_OTHERS does not match any preset key below (DO_NGRAM,
  # DO_WACKY, DO_ALL) — confirm how the loader treats an unmatched name.
  # NOTE(review): this switch is keyed on -use_judges, the same flag as the
  # judges switch further down, although this block selects reference
  # scores — confirm this is intended.
  _pb._skp.${-use_judges switch DO_OTHERS DO_NGRAM}:
    # rouge, bleu and bleu_adapt only.
    DO_NGRAM:
      use_scores_for_reference_values: ['rouge', 'bleu', 'bleu_adapt']
    # bleurt and bertscore only.
    DO_WACKY:
      use_scores_for_reference_values: ['bleurt', 'bertscore']
    # Union of the DO_WACKY and DO_NGRAM lists.
    DO_ALL:
      use_scores_for_reference_values: ['bleurt', 'bertscore', 'rouge', 'bleu', 'bleu_adapt']
  # Getenv placeholder for RUN_BCB_ONLINE with fallback token False.
  perform_exact_for_bcb: ${!getenv RUN_BCB_ONLINE False}
  # Switch-keyed block of judge presets: the key carries a switch placeholder
  # on -use_judges naming DO_JUDGES and DO_NOT; each child preset supplies a
  # use_judges value.
  # NOTE(review): DO_JUDGES does not match any preset key in this block (only
  # DO_NOT does) — confirm how the loader treats an unmatched name.
  _pb._skp.${-use_judges switch DO_JUDGES DO_NOT}:
    # Two Llama judges (3.1 8B and 3.3 70B) with no per-judge overrides.
    TRUE_ORO:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
    # Two Llama judges (3.3 70B and 3.1 8B), each with prompt_for_qa disabled.
    NON_QA_CONFIG:
      use_judges:
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          prompt_for_qa: false
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          prompt_for_qa: false
    # Four judges: the 8B and 70B Llama models without overrides, followed by
    # the same two models with prompt_for_qa disabled.
    FULL_KIT:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          prompt_for_qa: false
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          prompt_for_qa: false
    # The Llama 3.1 405B model listed twice: once with prompt_for_qa disabled
    # and once with it enabled.
    BIGGEST_MODELS:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-405b-instruct'
          prompt_for_qa: false
        - use_model: 'meta-llama/llama-3.1-405b-instruct'
          prompt_for_qa: true
    # Same four judge entries as FULL_KIT, each additionally setting
    # use_max_tokens to 16 and temperature to 0.5.
    FULL_KIT_UPPED:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.5
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.5
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.5
          prompt_for_qa: false
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.5
          prompt_for_qa: false
    # Same four judge entries as FULL_KIT_UPPED, differing only in
    # temperature (0.49 instead of 0.5).
    # NOTE(review): the near-identical temperature is presumably a way to get
    # a distinct second run of the same judges — confirm with the consumer.
    FULL_KIT_REDUNDANT_EDITION:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.49
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.49
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.49
          prompt_for_qa: false
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.49
          prompt_for_qa: false
    # The 8B and 70B Llama judges listed twice with use_max_tokens 16: first
    # at temperature 0.5, then at temperature 0.49. No entry sets
    # prompt_for_qa.
    FULL_KIT_QA:
      use_judges:
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.5
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.5
        - use_model: 'meta-llama/llama-3.1-8b-instruct'
          use_max_tokens: 16
          temperature: 0.49
        - use_model: 'meta-llama/llama-3.3-70b-instruct'
          use_max_tokens: 16
          temperature: 0.49
    # Preset that sets use_judges to null; DO_NOT is one of the two names in
    # the switch key of this block.
    DO_NOT:
      use_judges: null
    # Four judge entries with use_max_tokens 16 and an empty provider list:
    # deepseek-chat-v3-0324 at temperature 0.5 and qwen-2.5-72b-instruct at
    # temperature 0.49, each listed with prompt_for_qa disabled and enabled.
    # Despite the preset name, the first two entries are DeepSeek models.
    # NOTE(review): the meaning of an empty provider list is defined by the
    # consumer — confirm.
    FULL_QWEN_KIT:
      use_judges:
        - use_model: 'deepseek/deepseek-chat-v3-0324'
          use_max_tokens: 16
          temperature: 0.5
          provider: []
          prompt_for_qa: false
        - use_model: 'deepseek/deepseek-chat-v3-0324'
          use_max_tokens: 16
          temperature: 0.5
          provider: []
          prompt_for_qa: true
        - use_model: 'qwen/qwen-2.5-72b-instruct'
          use_max_tokens: 16
          temperature: 0.49
          provider: []
          prompt_for_qa: false
        - use_model: 'qwen/qwen-2.5-72b-instruct'
          use_max_tokens: 16
          temperature: 0.49
          provider: []
          prompt_for_qa: true
