---
# Experiment identity: a short name plus a human-readable description.
experiment:
  name: test_step_based
  description: 'Test configuration for step-based experiment system'

# Filesystem locations. `paths.data` carries the anchor `&data_path`, which is
# aliased by `components.task.question_answer.data_path`.
# NOTE(review): absolute, user-specific path — it will not resolve on other
# machines; confirm whether it should be overridden per environment.
paths:
  data: &data_path '/Users/gerschld/Desktop/dev/RnD/prompt_optimisation_dataset/data_preprocess'

# Component definitions. Each component type has a `default` entry naming one
# of its sibling keys; the `steps` section refers to it through
# `${components.<type>.default}`.
components:
  llm:
    default: OpenAI
    OpenAI:
      version_name: 'gpt-4o_v2024-11-20_USEAST'
      # Sampling parameters (floats).
      temperature: 0.5
      top_p: 0.95

  # Task component; `default` names the task configuration below.
  task:
    default: question_answer
    question_answer:
      # Alias of the `&data_path` anchor declared under `paths.data`.
      data_path: *data_path
      dataset_name: gsm8k
      train_test_flag: test
      # id_lst: [] runs the full dataset;
      #         [1, 2, 3, 4, 5] runs the first 5 examples.
      id_lst: []
      prompt_msg_template:
        - role: system
          # Folded scalar with default (clip) chomping: the value is the
          # sentence below followed by exactly one trailing newline.
          content: >
            Take a deep breath and work on this problem step-by-step.
        - role: user
          # Quoted because a leading `{` would otherwise open a flow mapping.
          # Presumably a placeholder filled per example — verify in task code.
          content: '{question}'

  # Prompt-optimiser component; the selected default is the entry keyed `none`.
  prompt_optimiser:
    # Quoted to make clear this is the string "none" (the key below), not null.
    default: 'none'
    none:
      psao_intro_prompt: ''
      psao_struct_ann: '(importance ann_var)'
      r_seed: 42
      optimise_user_prompt_flag: false
      # Optuna settings — NOTE(review): presumably the storage DB file, study
      # name and trial count; confirm against the optimiser implementation.
      optuna_db_name: prompt_opt_test_psao_db.db
      optuna_study_name: test_psao
      optuna_n_trials: 5

# Ordered list of pipeline steps. `component` steps name a component type and
# resolve the concrete component through `${components.<type>.default}`;
# `function` steps name a function and list the steps they depend on.
# NOTE(review): the exact scheduling semantics of `depends_on` live in the
# experiment runner — confirm there.
steps:
  # --- component initialisation ---
  - name: init_llm
    type: component
    component_type: llm
    component_name: '${components.llm.default}'

  - name: init_task
    type: component
    component_type: task
    component_name: '${components.task.default}'

  - name: init_prompt_optimiser
    type: component
    component_type: prompt_optimiser
    component_name: '${components.prompt_optimiser.default}'

  # --- function steps ---
  - name: optimise_prompt
    type: function
    function: optimise_prompt
    depends_on:
      - init_llm
      - init_task
      - init_prompt_optimiser

  - name: run_generation
    type: function
    function: run_generation
    depends_on:
      - init_llm
      - init_task
      - init_prompt_optimiser
      - optimise_prompt

  - name: evaluate_results
    type: function
    function: evaluate_results
    depends_on:
      - run_generation

# Output locations. The path is relative — presumably resolved against the
# process working directory; verify against the code that writes the results.
output:
  results_dataframe: 'output/test_step_based_results.csv'