# Registry of evaluation datasets. Each key under `dataset` names one dataset
# and maps to two string settings:
#   path_test: relative path to that dataset's test JSON file
#   prompt:    relative path under `prompts/` associated with the dataset
# NOTE(review): paths are presumably resolved against the repository root,
# and `prompt` presumably names a directory of prompt files — confirm both
# against the code that loads this config.
dataset:
  # Arithmetic datasets
  # aqua has its own prompt path; gsm8k, gsm-ic and svamp all share
  # "prompts/arithmetic".
  aqua:
    path_test: "dataset/test/aqua/test_full.json"
    prompt: "prompts/aqua"
  gsm8k:
    path_test: "dataset/test/gsm8k/test_full.json"
    prompt: "prompts/arithmetic"
  # NOTE(review): `gsm-ic` is the only hyphenated key among the entries
  # visible here; the others use snake_case. The key (and the matching
  # directory name in path_test) is a lookup value, so check callers before
  # normalising it.
  gsm-ic:
    path_test: "dataset/test/gsm-ic/test_full.json"
    prompt: "prompts/arithmetic"
  svamp:
    path_test: "dataset/test/svamp/test_full.json"
    prompt: "prompts/arithmetic"

  # Commonsense datasets
  # Each entry points at its own test_full.json and at a prompt path whose
  # last component matches the dataset key.
  csqa:
    path_test: "dataset/test/csqa/test_full.json"
    prompt: "prompts/csqa"
  sqa:
    path_test: "dataset/test/sqa/test_full.json"
    prompt: "prompts/sqa"
  socialiqa:
    path_test: "dataset/test/socialiqa/test_full.json"
    prompt: "prompts/socialiqa"

  # Symbolic datasets
  # Same layout as the groups above: one test_full.json per dataset and a
  # prompt path whose last component matches the dataset key.
  coin_flips:
    path_test: "dataset/test/coin_flips/test_full.json"
    prompt: "prompts/coin_flips"
  last_letters:
    path_test: "dataset/test/last_letters/test_full.json"
    prompt: "prompts/last_letters"

  # BBH tasks (presumably BIG-Bench Hard — confirm).
  # Unlike the groups above, both the test files and the prompt paths are
  # nested one level deeper, under a `bbh/` subdirectory.
  # NOTE(review): the test filename is not uniform within this group. The
  # first four entries point at `test.json`, while logical_deduction and
  # tracking_shuffled_objects point at `test_full.json`. Confirm that this
  # matches the files on disk and is intentional.
  date:
    path_test: "dataset/test/bbh/date/test.json"
    prompt: "prompts/bbh/date"
  causal_judgement:
    path_test: "dataset/test/bbh/causal_judgement/test.json"
    prompt: "prompts/bbh/causal_judgement"
  ruin_names:
    path_test: "dataset/test/bbh/ruin_names/test.json"
    prompt: "prompts/bbh/ruin_names"
  reasoning_about_colored_objects:
    path_test: "dataset/test/bbh/reasoning_about_colored_objects/test.json"
    prompt: "prompts/bbh/reasoning_about_colored_objects"
  # The two entries below use `test_full.json` (see the note at the top of
  # this group).
  logical_deduction:
    path_test: "dataset/test/bbh/logical_deduction/test_full.json"
    prompt: "prompts/bbh/logical_deduction"
  tracking_shuffled_objects:
    path_test: "dataset/test/bbh/tracking_shuffled_objects/test_full.json"
    prompt: "prompts/bbh/tracking_shuffled_objects"