# K-module MT-STS configuration for OpenEvolve

max_iterations: 50
checkpoint_interval: 10
log_level: "INFO"
random_seed: 123
language: "python"
file_suffix: ".py"

# This family is a combinatorial configuration search, so full rewrites are
# a better fit than diff-based evolution.
diff_based_evolution: false
max_code_length: 10000

llm:
  api_base: "http://127.0.0.1:4000"
  api_key: "litellm"
  primary_model: "claude-sonnet-4-6"
  primary_model_weight: 1.0
  secondary_model: null
  secondary_model_weight: 0.0
  temperature: 0.9
  max_tokens: 4096
  timeout: 60
  retries: 3

prompt:
  system_message: |
    You are optimizing a four-module pipeline configuration over a hidden
    family of related tasks.

    The pipeline modules are:
    - loader: ['csv_reader', 'json_reader', 'xml_reader', 'parquet_reader', 'sql_reader']
    - preprocess: ['normalize', 'standardize', 'minmax', 'scale', 'none']
    - algorithm: ['quicksort', 'mergesort', 'heapsort', 'bubblesort', 'insertion']
    - formatter: ['json', 'xml', 'csv', 'yaml', 'protobuf']

    Important:
    - In shared mode, the score is the average over multiple hidden tasks.
    - Feedback is aggregate only; do not assume you know which single module is wrong.
    - Explore combinations systematically and reuse high-scoring building blocks.

  num_top_programs: 5
  num_diverse_programs: 3
  include_artifacts: true
  max_artifact_bytes: 10240

database:
  population_size: 25
  archive_size: 15
  num_islands: 5
  elite_selection_ratio: 0.15
  exploration_ratio: 0.6
  exploitation_ratio: 0.25
  feature_dimensions: ["complexity", "diversity"]
  feature_bins: 5
  migration_interval: 3
  migration_rate: 0.3

evaluator:
  timeout: 30
  max_retries: 2
  cascade_evaluation: false
  parallel_evaluations: 4
  use_llm_feedback: false
  enable_artifacts: true

early_stopping_patience: 100
convergence_threshold: 0.001
early_stopping_metric: "combined_score"
