# === HUGGINGFACE SETTINGS CONFIGURATION ===
# You can configure all aspects of your huggingface 
hf_configuration:
  token: $HF_TOKEN # you can get one from here: https://huggingface.co/docs/huggingface_hub/en/quick-start#authentication
  hf_organization: $HF_ORGANIZATION # set this env variable to be your username!
  private: false # true by default, set to false to make the dataset publicly viewable!
  hf_dataset_name: yourbench_example # name of the dataset to save the traces, and generated questions to.
  concat_if_exist: false # concatenate the dataset if it already exists

# you can also set this to be a local dataset
# local_dataset_dir: /some/path

# === MODEL CONFIGURATION ===
model_list: 
  # to use the default huggingface inference
  - model_name: Qwen/Qwen2.5-VL-72B-Instruct
    provider:  hf-inference # as a default value
    api_key: $HF_TOKEN
    max_concurrent_requests: 32
  # to use the default huggingface inference
  - model_name: Qwen/Qwen2.5-72B-Instruct
    provider: novita # or another desired provider, the list of available providers is here: https://huggingface.co/docs/huggingface_hub/guides/inference#supported-providers-and-tasks
    api_key: $HF_TOKEN
    max_concurrent_requests: 32

model_roles:
  ingestion:
    - Qwen/Qwen2.5-VL-72B-Instruct # you should use a vision supported model for ingestion
  summarization:
    - Qwen/Qwen2.5-72B-Instruct
  chunking:
    - intfloat/multilingual-e5-large-instruct # your sentence level chunking model
  single_shot_question_generation:
    - Qwen/Qwen2.5-72B-Instruct
  multi_hop_question_generation:
    - Qwen/Qwen2.5-72B-Instruct

pipeline:
  # to convert your documents from their source format to markdown
  ingestion:
    run: true
    # set this to where your raw documents are located
    source_documents_dir: example/data/raw
    # .... and this to where you want them to be processed to
    output_dir: example/data/processed

  # to convert your documents to a huggingface dataset
  upload_ingest_to_hub:
    run: true
    source_documents_dir: example/data/processed

  # to create a global summary of your documents
  summarization:
    run: true
  
  chunking:
    run: true
    chunking_configuration:
      l_min_tokens: 64 # how many minimum tokens you want in each chunk
      l_max_tokens: 128 # how many max tokens in each chunk
      tau_threshold: 0.8 # what threshold to decide a boundary
      h_min: 2 # for multi-hop configurations, minimum number of unique chunks to combine
      h_max: 5 # maximum number of unique chunks to combine to make a multi-hop set
      num_multihops_factor: 2   # or any integer or float. higher numbers generate a larger number of multi-hops
  
  single_shot_question_generation:
    run: true
    # you can add any additional instructions you want here! try it out!
    additional_instructions: "Generate questions to test a curious adult"
    # for cost reduction. if you set all, then all chunks will be used
    chunk_sampling:
      mode: "count" # or "all" for all chunks
      value: 5
      random_seed: 123
  
  multi_hop_question_generation:
    run: true
    additional_instructions: "Generate questions to test a curious adult"
    # for cost reduction
    chunk_sampling:
      mode: "percentage" # or "count" for a fixed number
      value: 0.3
      random_seed: 42

  # this combines your single shot and multi-hop questions into one nice dataset!
  lighteval:
    run: true
