# Hydra configuration for running multiple RSP probability experiments with vLLM
# Covers a grid search over prompt types and temperatures.

# Base configurations (applied unless overridden in a variation)
defaults:
  - model: qwen14b # Default model config group (adjust as needed)
  - prompt: default # Default prompt config group (will be overridden in variations)
  - sampling: default # Default sampling config group (temperature overridden)
  - experiment: base # Default experiment config group (num_samples overridden)
  - _self_

# Base model settings (MUST set model_path and tokenizer_path via CLI or here)
model:
  model_path: Qwen/Qwen2.5-14B-Instruct
  tokenizer_path: Qwen/Qwen2.5-14B-Instruct
  name: qwen14b # Inherited from defaults

# Base prompt settings (words/probs used by all variations unless overridden)
prompt:
  words: ["Rock", "Paper", "Scissors"]
  probabilities: [0.33333, 0.33333, 0.33334] # Uniform probability
  # type: default # Base type, overridden below

# Base sampling settings (temperature overridden below)
sampling:
  temperature: 1.0 # Base temperature, overridden below
  max_tokens: 4096

# Base experiment settings (num_samples used by all variations)
experiment:
  num_samples: 1000 # Set desired number of samples
  output_dir_suffix: "rsp_probability_vllm_grid" # Suffix for the main output folder

# --- List of Experiment Variations ---
# Grid search: 4 prompt types * 9 temperatures = 36 variations
experiments:
  # --- Prompt Type: default ---
  - name: "rsp_default_temp0.0"
    prompt: {type: default}
    sampling: {temperature: 0.0}
  - name: "rsp_default_temp0.2"
    prompt: {type: default}
    sampling: {temperature: 0.2}
  - name: "rsp_default_temp0.4"
    prompt: {type: default}
    sampling: {temperature: 0.4}
  - name: "rsp_default_temp0.6"
    prompt: {type: default}
    sampling: {temperature: 0.6}
  - name: "rsp_default_temp0.8"
    prompt: {type: default}
    sampling: {temperature: 0.8}
  - name: "rsp_default_temp1.0"
    prompt: {type: default}
    sampling: {temperature: 1.0}
  - name: "rsp_default_temp1.2"
    prompt: {type: default}
    sampling: {temperature: 1.2}
  - name: "rsp_default_temp1.4"
    prompt: {type: default}
    sampling: {temperature: 1.4}
  - name: "rsp_default_temp1.6"
    prompt: {type: default}
    sampling: {temperature: 1.6}

  # --- Prompt Type: direct ---
  - name: "rsp_direct_temp0.0"
    prompt: {type: direct}
    sampling: {temperature: 0.0}
  - name: "rsp_direct_temp0.2"
    prompt: {type: direct}
    sampling: {temperature: 0.2}
  - name: "rsp_direct_temp0.4"
    prompt: {type: direct}
    sampling: {temperature: 0.4}
  - name: "rsp_direct_temp0.6"
    prompt: {type: direct}
    sampling: {temperature: 0.6}
  - name: "rsp_direct_temp0.8"
    prompt: {type: direct}
    sampling: {temperature: 0.8}
  - name: "rsp_direct_temp1.0"
    prompt: {type: direct}
    sampling: {temperature: 1.0}
  - name: "rsp_direct_temp1.2"
    prompt: {type: direct}
    sampling: {temperature: 1.2}
  - name: "rsp_direct_temp1.4"
    prompt: {type: direct}
    sampling: {temperature: 1.4}
  - name: "rsp_direct_temp1.6"
    prompt: {type: direct}
    sampling: {temperature: 1.6}

  # --- Prompt Type: code ---
  - name: "rsp_code_temp0.0"
    prompt: {type: code}
    sampling: {temperature: 0.0}
  - name: "rsp_code_temp0.2"
    prompt: {type: code}
    sampling: {temperature: 0.2}
  - name: "rsp_code_temp0.4"
    prompt: {type: code}
    sampling: {temperature: 0.4}
  - name: "rsp_code_temp0.6"
    prompt: {type: code}
    sampling: {temperature: 0.6}
  - name: "rsp_code_temp0.8"
    prompt: {type: code}
    sampling: {temperature: 0.8}
  - name: "rsp_code_temp1.0"
    prompt: {type: code}
    sampling: {temperature: 1.0}
  - name: "rsp_code_temp1.2"
    prompt: {type: code}
    sampling: {temperature: 1.2}
  - name: "rsp_code_temp1.4"
    prompt: {type: code}
    sampling: {temperature: 1.4}
  - name: "rsp_code_temp1.6"
    prompt: {type: code}
    sampling: {temperature: 1.6}

  # --- Prompt Type: fixed_seed ---
  # NOTE: You MUST provide a unique 'fixed_random_string' for each 'fixed_seed' run if you intend to use it.
  # Using the same string repeatedly defeats the purpose unless comparing determinism.
  # A placeholder is added here. Modify or remove these variations if not needed.
  - name: "rsp_fixed_seed_temp0.0"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 0.0} # Temperature might be less relevant here
  - name: "rsp_fixed_seed_temp0.2"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 0.2}
  - name: "rsp_fixed_seed_temp0.4"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 0.4}
  - name: "rsp_fixed_seed_temp0.6"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 0.6}
  - name: "rsp_fixed_seed_temp0.8"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 0.8}
  - name: "rsp_fixed_seed_temp1.0"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 1.0}
  - name: "rsp_fixed_seed_temp1.2"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 1.2}
  - name: "rsp_fixed_seed_temp1.4"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 1.4}
  - name: "rsp_fixed_seed_temp1.6"
    prompt: {type: fixed_seed, fixed_random_string: "R4EK4A8ZzeIn9Vbu"}
    sampling: {temperature: 1.6}
