{"experiment_name": "benchmark_experiment_gsm8k_qwen_CAPO_44", "random_seed": 44, "budget_per_run": 5000000, "output_dir": "results//gsm8k/qwen/CAPO/seed44/", "dataset": "gsm8k", "model": "vllm-Qwen/Qwen2.5-32B-Instruct-GPTQ-Int4", "model_revision": "c83e67dfb2664f5039fd4cd99e206799e27dd800", "max_model_len": 2048, "batch_size": null, "model_storage_path": "../models/", "optimizer": "CAPO", "n_steps": 999, "population_size": 10, "n_eval_samples": null, "evoprompt_ga_template": "standard", "block_size": 30, "length_penalty": 0.05, "crossovers_per_iter": 4, "upper_shots": 5, "max_n_blocks_eval": 10, "alpha": 0.2, "shuffle_blocks_per_iter": false}