# Hydra configuration for the Random Generation Experiment

defaults:
  - _self_
  # Add other defaults if needed, e.g., for logging or specific environments
  # - override hydra/job_logging: colorlog
  # - override hydra/hydra_logging: colorlog

hydra:
  run:
    # Output directory pattern: outputs/YYYY-MM-DD/HH-MM-SS
    dir: outputs/${experiment.name}/${now:%Y-%m-%d_%H-%M-%S}
  sweep:
    # Output directory pattern for multirun: multirun/YYYY-MM-DD/HH-MM-SS
    dir: multirun/${experiment.name}/${model.litellm_model_name}/${now:%Y-%m-%d_%H-%M-%S}
    subdir: ${hydra.job.num} # Subdirectory for each run in a multirun sweep

experiment:
  # Name for the experiment (used potentially in logging/output paths)
  name: "random_generation_test"

  # Parameters for the random integer generation
  min_value: 0       # Minimum value for the random integer (inclusive)
  max_value: 127 # Maximum value for the random integer (inclusive)

  # Number of samples (LLM calls) to generate
  num_samples: 1000

  # Optional suffix for the output directory within the hydra run folder
  output_dir_suffix: "random_gen_results"

  # Whether to use budget forcing instead of standard batch completion
  use_budget_forcing: true

  # Number of parallel workers for budget forcing (if enabled)
  parallel_workers: 100

  # Number of "Wait" token insertions for budget forcing (if enabled)
  num_wait_insertion: 4
  
  max_think_tokens: 512

  is_sequential_request: false
  only_str: false
  only_int: false

model:
  # Name used for identifying the model in outputs/logs
  name: "s1.1-32B" # e.g., qwen, deepseek, gemini

  # LiteLLM model string (e.g., "openai/gpt-4", "anthropic/claude-3-opus-20240229", "google/gemini-pro")
  # Ensure this matches a model supported by your LiteLLM setup/proxy
  litellm_model_name: hosted_vllm/simplescaling/s1.1-32B
  tokenizer_name: Qwen/Qwen2.5-32B-Instruct

  # API Base URL (if using a proxy or self-hosted model)
  api_base: http://localhost:8318/v1
  # api_base: "http://0.0.0.0:4000" # Example for local proxy

  # API Key (use environment variables for security in real scenarios)
  api_key: null # Set via environment variable (e.g., OPENAI_API_KEY) or directly if needed
  # api_key: "sk-..."

sampling:
  # Temperature for sampling randomness (0.0 = deterministic, >1.0 = more random)
  temperature: 0.7

  # Maximum number of tokens to generate in the response
  max_tokens: 30000
  top_p: 0.95

  # Add other sampling parameters if needed (e.g., top_p, top_k)
