#!/bin/bash

### Mining model
# Model id and sampling temperature; both are forwarded to initializer.py
# (--initializer_model / --initializer_temperature).
INITIALIZER_TEMPERATURE=0.0
INITIALIZER_MODEL="x-ai/grok-4.1-fast"

### Mining dataset
# DATA_NAME is the basename of the .jsonl file under INPUT_PATH.
# NOTE(review): this section was originally labelled "small subset for
# verification", yet MAX_SAMPLES is 9999 -- confirm which is intended.
DATA_NAME="math_precalculus_5_test"
MAX_WORKERS=10
MAX_SAMPLES=9999
EMBEDDING_MODEL="text-embedding-3-large"

### Paths
# OUTPUT_PATH embeds the raw model id, so a "/" inside the id yields a nested
# directory (e.g. data/<dataset>_x-ai/grok-4.1-fast/).
INPUT_PATH="data"
OUTPUT_PATH="$INPUT_PATH/${DATA_NAME}_$INITIALIZER_MODEL/"

### Log file
# Filesystem-safe name fragments: "/" and ":" in the model id and "/" in the
# dataset name are replaced with "_" so the log name stays a single path
# component under logs/.
SAFE_MODEL=${INITIALIZER_MODEL//[\/:]/_}
SAFE_DATASET=${DATA_NAME//\//_}
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
printf -v LOG_FILE 'logs/debug_init_%s_%s_%s.log' \
    "$SAFE_MODEL" "$SAFE_DATASET" "$TIMESTAMP"

# Ensure the output directory and the directory that will hold the log file
# both exist. The log directory is created here so the run does not depend on
# initializer.py creating it; abort early if either cannot be created.
log_dir=$(dirname -- "$LOG_FILE")
if ! mkdir -p -- "$OUTPUT_PATH" "$log_dir"; then
    echo ">>> ERROR: could not create '$OUTPUT_PATH' or '$log_dir'." >&2
    exit 1
fi

# Echo the effective configuration so it is captured alongside the run output.
echo ">>> Running Initialization (Mining) on $DATA_NAME with $INITIALIZER_MODEL ..."
echo "---------------- Configuration ----------------"
echo "INITIALIZER_MODEL:    $INITIALIZER_MODEL"
echo "INITIALIZER_TEMPERATURE:     $INITIALIZER_TEMPERATURE"
echo "EMBEDDING_MODEL:     $EMBEDDING_MODEL"
echo "DATA_NAME:     $DATA_NAME"
echo "MAX_SAMPLES:   $MAX_SAMPLES"
echo "MAX_WORKERS:   $MAX_WORKERS"
echo "OUTPUT_PATH:   $OUTPUT_PATH"
echo "-------------------------------------------------"

# Launch the initializer. Every expansion is quoted so a value containing
# whitespace or glob characters is passed as exactly one argument.
python3 src/agents/initializer.py \
    --initializer_model "$INITIALIZER_MODEL" \
    --initializer_temperature "$INITIALIZER_TEMPERATURE" \
    --input_path "${INPUT_PATH}/${DATA_NAME}.jsonl" \
    --max_samples "$MAX_SAMPLES" \
    --max_workers "$MAX_WORKERS" \
    --experience_path "$OUTPUT_PATH" \
    --log_file "$LOG_FILE" \
    --embedding_model "$EMBEDDING_MODEL" \
    --debug
init_status=$?

# Propagate a failed run instead of announcing success: callers (CI, wrapper
# scripts) see the initializer's own exit status.
if [ "$init_status" -ne 0 ]; then
    echo ">>> ERROR: initializer.py exited with status $init_status (log file: $LOG_FILE)." >&2
    exit "$init_status"
fi

echo ">>> Initialization complete. Check $OUTPUT_PATH for results."
