project:
  name: ACE-RAG

run:
  output_root: ${ACE_RAG_OUTPUT_DIR:-outputs}
  echo_logs: true
  save_prompts: false
  enable_timing: true
  protocol: common_prompt

logging:
  save_rendered_context: true
  save_full_prompt: false
  rendered_context_preview_chars: 2000

indexing:
  doc_anchor_mode: title
  # ACE-RAG keeps indexing cheap: title entity hub + sentence propositions + packed source chunks.
  # Chunk is a source/provenance span. Retrieval primarily uses propositions.
  max_chunk_tokens: 240
  min_prop_tokens: 2
  chunk_overlap_sentences: 0
  show_progress: true
  embedding:
    enabled: true
    provider: local_nvembed
    backend: transformers
    model_path: ${NVEMBED_MODEL_PATH}
    device: ${EMBED_DEVICE:-cuda}
    device_map: null
    batch_size: 32
    normalize: true
    trust_remote_code: true
    local_files_only: true
    max_seq_length: 32768
    add_eos: true
    query_instruction: "Given a question, retrieve passages that answer the question"
    passage_instruction: ""
    torch_dtype: float16
    model_kwargs:
      torch_dtype: float16
    save_dtype: float16

retrieval:
  retrieval_variant: full_hetero
  seed_selection_variant: global_seed_search
  random_seed: 13
  search_units: [proposition, chunk, entity]
  candidate_top_k: 80
  min_candidate_pool: 80
  candidate_cap:
    enabled: false
    total_candidates: 80
    title_candidates: null
    chunk_candidates: null
    proposition_candidates: null
  optimization:
    stable_dedup_before_seed: false
  seed_count: 4
  seed_trials: 7
  sample_multiplier: 6
  seed_pool_top_k: 80
  diversity_weight: 0.35
  context_token_budget: 3000
  entity_anchor_score: 5.0
  entity_anchor_prop_limit: 16
  scan_titles_in_question: false
  title_scan_limit: 50000
  weights:
    bm25: 0.35
    dense: 0.55
    entity: 0.10
  bm25:
    top_k: 80
    k1: 1.5
    b: 0.75
  dense:
    enabled: true
    top_k: 80
    units: [proposition, chunk]
  bridge:
    enabled: true
    selection: residual_lexical
    max_mentions_per_prop: 3
    max_bridge_titles_per_seed: 2
    max_bridge_props_per_title: 2
    skip_ambiguous_aliases: true
    min_alias_tokens: 2
    remove_self_mentions: true
    ordering: anchor_chain_aware
    anchor_constrained: true
    multi_anchor_bundle: true
    demote_generic_relation_titles: true
    use_automaton: true
  # main.py copies indexing.embedding into retrieval.embedding unless overridden.
  embedding: {}
  refine:
    per_entity_propositions: 4
    per_entity_chunks: 2
    max_bundles: 6

generation:
  provider: vllm
  base_url: ${ACE_RAG_LLM_BASE_URL:-http://127.0.0.1:8013/v1}
  model: ${VLLM_MODEL:-auto}
  temperature: 0.0
  top_p: 1.0
  max_new_tokens: 64
  timeout_s: 120
  retries: 1
  retry_sleep_s: 2.0
  max_context_chars: 16000
  prompt_profile: common_qa
  rendering_profile: structured_chain
  compaction_profile: chain_dedup
  top_bundles: 3
  system_message: ""
  token_counting:
    enabled: true
    tokenizer_model: auto
    fallback_to_estimate: true

eval:
  metrics: [em, f1, answer_contains, support_title_recall, context_tokens, latency_ms]

paper_protocol:
  name: common_prompt
  paper_section: main common-prompt result
  description: Main ACE-RAG common-prompt protocol for the submitted paper.
  fixed_settings:
    doc_anchor_mode: title
    prompt_protocol: common_qa
    rendering_policy: compact_chain_dedup
    rendered_bundle_budget: 3

datasets:
  popqa:
    type: popqa
    qa_path: ${ACE_RAG_DATA_DIR:-data}/popqa/popqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/popqa/popqa_corpus.json
  hotpotqa:
    type: hotpotqa
    qa_path: ${ACE_RAG_DATA_DIR:-data}/hotpotqa/hotpotqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/hotpotqa/hotpotqa_corpus.json
  2wiki:
    type: 2wiki
    qa_path: ${ACE_RAG_DATA_DIR:-data}/2wiki/2wikimultihopqa.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/2wiki/2wikimultihopqa_corpus.json
  musique:
    type: musique
    qa_path: ${ACE_RAG_DATA_DIR:-data}/musique/musique.json
    corpus_path: ${ACE_RAG_DATA_DIR:-data}/musique/musique_corpus.json
