config_anchors:
  data_path: &data_path /Users/anjin.liu/Documents/GitHub/prompt_optimisation_dataset/data_preprocess
  dataset_name: &dataset_name gsm8k
  experiment_name: &experiment_name gsm8k_baseline
  experiment_description: &experiment_description GSM8K experiment with no system prompt
  results_path: &results_path output/gsm8k_baseline_results.csv

experiment:
  name: *experiment_name
  description: *experiment_description

components:
  llm:
    default: OpenAI
    OpenAI:
      # version_name: gpt-4o_v2024-11-20_USEAST
      # version_name: bedrock-claude-4-sonnet
      version_name: gemini-2.0-flash-001
      temperature: 0.5
      top_p: 0.95

  task:
    default: question_answer
    question_answer:
      data_path: *data_path
      dataset_name: *dataset_name
      train_test_flag: test
      # to run full dataset
      # id_lst: []
      id_lst: []
      prompt_msg_template:
        - role: system
          content: >
            Take a deep breath and work on this problem step-by-step.
        - role: user
          content: "{question}"

steps:
  - name: "init_llm"
    type: "component"
    component_type: "llm"
    component_name: "${components.llm.default}"
  
  - name: "init_task"
    type: "component"
    component_type: "task"
    component_name: "${components.task.default}"

  - name: "run_generation"
    type: "function"
    function: "run_generation"
    depends_on: ["init_llm", "init_task"]
  
  - name: "evaluate_results"
    type: "function"
    function: "evaluate_results"
    depends_on: ["run_generation"]

output:
  results_dataframe: output/gsm8k_baseline_results.csv