# Hydra-style defaults list: every `group: option` entry picks one config from
# that config group to compose together with this file.
defaults:
  # `_self_` is listed first, so the group configs below are composed after
  # this file's own values (later entries take precedence on conflicting keys
  # under Hydra's composition order). NOTE(review): confirm this is intended.
  - _self_
  - evo/crossover: model_linear
  - evo/mutation: svd_model_weights_gaussian_noise
  - docker_sandbox: default
  - celery: default
  # Currently disabled config group, kept for reference:
  # - experts: default
  - task_generation: default
  - acd: default
  - dns: default

# Data directory for all tasks
data_dir: data

# Enable ACD-DNS integration
use_acd_dns: true

# TODO: add a CMA-ES baseline. The flag is switched off in this config.
use_cma: false

# NOTE(review): presumably the share of GPU memory the inference engine may
# claim (same name as vLLM's `gpu_memory_utilization` option) — confirm
# against the code that reads this key.
gpu_memory_utilization: 0.8

# SVD expert names. The original author noted `null` as an alternative value
# for this key. NOTE(review): confirm what `null` means to the consumer.
svd_expert_names:
  - csbench
  - gsm8k
  - instruct

# Model selection: Qwen2 7B
base_model_path: 'Qwen/Qwen2-7B'
seed_model_paths:
  - 'Grogros/Qwen2-7B-OurSafecoder'
  - 'Qwen/Qwen2-Math-7B-Instruct'
  - 'Qwen/Qwen2-7B-Instruct'
# Stop token ids; these are specific to Qwen2 as well.
model_stop_token_ids:
  - 151643
  - 151645
chat_template: 'qwen2'

# Logging and monitoring (Weights & Biases)
use_wandb: true
wandb:
  entity: '<your_wandb_entity>'  # placeholder value; substitute a real entity
  project: 'acdc'
  name: 'acd-dns-integrated'

# Tasks used for validation. `mbpp` is listed but commented out.
validation_tasks:
  - csbench
  - gsm8k
  # - mbpp

# Ray configuration for fractional GPU assignment
frac_gpu:
  enabled: false                # Enable Ray for fractional GPU assignment
  # Fraction of a GPU to allocate per worker. With a compiled vLLM model,
  # leave some memory free for other processes (e.g. use 0.2 rather than 0.25).
  gpu_fraction: 0.1
  workers_per_gpu: 1           # Number of workers to run per GPU
  # NOTE(review): the three keys below carry no documentation in this file;
  # presumably GPU count, GPU index, and the worker's slot on its GPU — confirm.
  num_gpus: 1
  gpu_id: 0
  worker_id_in_gpu: 0

# Generation settings for `vllm_pop`.
# NOTE(review): presumably vLLM sampling parameters used when evaluating the
# model population — confirm against the consumer.
vllm_pop:
  # EOS tokens for the merged models; interpolated from the top-level
  # `model_stop_token_ids` key of this file.
  stop_token_ids: ${model_stop_token_ids}
  max_tokens: 512
  temperature: 0.0
  top_p: 1.0
  eval_cot: true  # NOTE(review): presumably toggles chain-of-thought evaluation — confirm

# Evaluation parameters
evaluation:
  batch_size: 16                  # Batch size for task evaluation
  # Timeout for evaluating a single example.
  # NOTE(review): unit is not stated here; presumably seconds — confirm.
  timeout: 30
  max_retries: 3                 # Maximum retries for failed evaluations
  retry_delay: 1.0               # Delay between retries, in seconds

# Output directory
output_dir: 'outputs/acdc'

# Seed for random number generation, fixed for reproducibility
seed: 42

# Disk cleaning configuration
disk_cleaning_interval: 2        # Clean up old models every N generations
max_models_to_keep: 100          # Maximum number of models to keep on disk
# Generations whose index is a multiple of this interval are exempt from
# cleanup (all of their models are kept). Suggested values: 25 for long runs,
# 5 otherwise.
model_cleanup_skip_interval: 5
save_init_gen_models: true       # Keep generation-0 checkpoints for later evaluation

# Elite evaluation configuration
elite_evaluation_interval: 10000      # Evaluate elite models every N generations

# Additional wandb setting, kept at the top level rather than under `wandb`.
# NOTE(review): presumably the id of a wandb run to resume, with null meaning
# "start a fresh run" — confirm.
wandb_resume_id: null

# Restart configuration
# Path to a checkpoint directory for restarting a run
# (e.g., '/path/to/outputs/2025-05-26/12-13-52'); null is the value set here.
restart_dir: null
