# Project metadata. The name identifies this file as the "smoke" variant of
# the ACE-RAG configuration (presumably a quick sanity-check run; confirm
# against the code that consumes `project.name`).
project:
  name: ACE-RAG-smoke

# Run-level settings: where results go and what is echoed or saved.
run:
  # Shell-style `${VAR:-default}` placeholder: the value of
  # ACE_RAG_OUTPUT_DIR, falling back to `outputs`. YAML itself does not
  # expand this; to the parser it is a plain string.
  # NOTE(review): confirm the config loader expands the `:-` default form.
  output_root: ${ACE_RAG_OUTPUT_DIR:-outputs}
  echo_logs: true
  # NOTE(review): `logging.save_full_prompt` in this file is a similarly
  # named flag (also false); confirm whether both are actually read.
  save_prompts: false

# Logging flags: the rendered context is saved, the full prompt is not.
logging:
  save_rendered_context: true
  save_full_prompt: false
  # Presumably the maximum number of characters of rendered context kept in
  # a preview — TODO confirm against the logging code.
  rendered_context_preview_chars: 2000

# Index-construction settings.
indexing:
  # Named mode; its meaning is defined by the indexing code (not visible
  # from this file).
  doc_anchor_mode: title
  # Token/sentence limits. NOTE(review): presumably an upper bound per chunk
  # and a lower bound per proposition, as the names suggest — confirm.
  max_chunk_tokens: 240
  min_prop_tokens: 2
  chunk_overlap_sentences: 0
  show_progress: false
  # Embeddings are switched off here, consistent with
  # `retrieval.dense.enabled: false` and `retrieval.embedding.enabled: false`
  # elsewhere in this file.
  embedding:
    enabled: false

# Retrieval settings. In this configuration all dense/embedding components
# are disabled and scoring is weighted 0.90 BM25 / 0.10 entity (see
# `weights`). Key semantics are defined by the retrieval code, which is not
# visible from this file; notes below state only what the values show.
retrieval:
  # Named variants selected by string; valid values are defined elsewhere.
  retrieval_variant: full_hetero
  seed_selection_variant: global_seed_search
  # Fixed seed. NOTE(review): presumably makes sampling reproducible —
  # confirm where it is consumed.
  random_seed: 13
  search_units: [proposition, chunk, entity]
  # NOTE(review): `candidate_top_k`, `min_candidate_pool`,
  # `candidate_cap.total_candidates`, `seed_pool_top_k` and `bm25.top_k` are
  # all 40 in this file; presumably they should be changed together.
  candidate_top_k: 40
  min_candidate_pool: 40
  # Capping is disabled; the per-kind limits are explicit nulls.
  # NOTE(review): presumably the remaining keys are ignored while
  # `enabled` is false — confirm.
  candidate_cap:
    enabled: false
    total_candidates: 40
    title_candidates: null
    chunk_candidates: null
    proposition_candidates: null
  optimization:
    stable_dedup_before_seed: false
  seed_count: 3
  seed_trials: 3
  sample_multiplier: 4
  seed_pool_top_k: 40
  diversity_weight: 0.35
  context_token_budget: 2200
  entity_anchor_score: 5.0
  entity_anchor_prop_limit: 12
  scan_titles_in_question: false
  # The three weights sum to 1.0 (0.90 + 0.0 + 0.10). `dense: 0.0` matches
  # `dense.enabled: false` below. `0.90` parses as the float 0.9.
  weights:
    bm25: 0.90
    dense: 0.0
    entity: 0.10
  bm25:
    top_k: 40
  # Dense retrieval is off: disabled flag, zero top_k, and an explicit empty
  # list of units (`[]`, not null).
  dense:
    enabled: false
    top_k: 0
    units: []
  # Bridge step is enabled. `selection` and `ordering` are named strategies
  # whose behavior is defined by the retrieval code.
  bridge:
    enabled: true
    selection: residual_lexical
    max_mentions_per_prop: 3
    max_bridge_titles_per_seed: 2
    max_bridge_props_per_title: 2
    skip_ambiguous_aliases: true
    min_alias_tokens: 2
    remove_self_mentions: true
    ordering: anchor_chain_aware
    anchor_constrained: true
    multi_anchor_bundle: true
    demote_generic_relation_titles: true
    use_automaton: true
  # NOTE(review): separate from `dense.enabled` above and from
  # `indexing.embedding.enabled`; all three are false here. Confirm which
  # flag the code actually reads.
  embedding:
    enabled: false
  refine:
    per_entity_propositions: 4
    per_entity_chunks: 2
    max_bundles: 5

# Answer-generation settings.
generation:
  # `none` is the plain string "none", not a YAML null (null would be
  # written `null` or `~`). NOTE(review): presumably means no generator
  # backend is called in this configuration — confirm.
  provider: none
  max_context_chars: 12000
  # Named profiles selected by string; definitions live in the consuming
  # code.
  prompt_profile: common_qa
  rendering_profile: structured_chain
  compaction_profile: chain_dedup
  top_bundles: 3
  token_counting:
    enabled: true
    # `auto` is a plain string. NOTE(review): presumably lets the code pick
    # a tokenizer, with `fallback_to_estimate` covering the case where none
    # is available — confirm.
    tokenizer_model: auto
    fallback_to_estimate: true

# Evaluation settings.
eval:
  # Metric identifiers, in order, one per line.
  # NOTE(review): names must match what the evaluator recognizes; that
  # mapping is not visible from this file.
  metrics:
    - em
    - f1
    - answer_contains
    - support_title_recall
    - context_tokens
    - latency_ms

# Dataset registry. Every entry has the same three keys: `type`, `qa_path`
# and `corpus_path`. All paths start with the `${ACE_RAG_DATA_DIR:-data}`
# placeholder (shell-style: the value of ACE_RAG_DATA_DIR, else `data`),
# followed by a per-dataset directory. YAML does not expand the placeholder;
# to the parser each path is a plain string.
# NOTE(review): confirm the config loader expands the `:-` default form.
datasets:
  popqa:
    type: popqa
    qa_path: ${ACE_RAG_DATA_DIR:-data}/popqa/popqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/popqa/popqa_corpus.json
  hotpotqa:
    type: hotpotqa
    qa_path: ${ACE_RAG_DATA_DIR:-data}/hotpotqa/hotpotqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/hotpotqa/hotpotqa_corpus.json
  # `2wiki` starts with a digit but is not a valid number, so both the key
  # and the `type` value are parsed as strings.
  2wiki:
    type: 2wiki
    qa_path: ${ACE_RAG_DATA_DIR:-data}/2wiki/2wikimultihopqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/2wiki/2wikimultihopqa_corpus.json
  musique:
    type: musique
    qa_path: ${ACE_RAG_DATA_DIR:-data}/musique/musique.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/musique/musique_corpus.json
