#!/bin/bash
# run1_regularization.sh

### Model for Regularization
REGULARIZER_MODEL="x-ai/grok-4.1-fast"
REGULARIZER_TEMPERATURE=0.0

### Dataset for Mining (using a small subset for verification)
DATA_NAME="math_precalculus_5_train"
TOTAL_LIMIT=30
SUBJECT_LIMIT=100
EXP_MAX_TOKENS=1000

### Paths
INPUT_PATH="experiments/exp7_opt_reg/epoch1"
OUTPUT_PATH="experiments/exp7_opt_reg/epoch1_reg"

# Clustering Mode: 'problem' or 'condition'
MODE=${1:-"problem"}

# Log Configuration
SAFE_MODEL=$(echo "${REGULARIZER_MODEL}" | sed 's/\//_/g' | sed 's/:/_/g')
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
LOG_FILE="logs/debug_reg_${SAFE_MODEL}_${MODE}_${TIMESTAMP}.log"

# Configuration
EXPERIENCE_POOL="${INPUT_PATH}/experience_pool.jsonl"
META_FILE="${INPUT_PATH}/question_meta.json"
EXPERIENC_REG_POOL="${OUTPUT_PATH}/experience_pool.jsonl"
META_REG_FILE="${OUTPUT_PATH}/question_meta.json"

# Embedding Files (ensure these exist)
EMBEDDING_MODEL="text-embedding-3-large"
PROBLEM_EMBEDDING_FILE="data/${DATA_NAME}_${EMBEDDING_MODEL}_idx.npz"
EXP_EMBEDDING_FILE="${INPUT_PATH}/experience_idx.npz"

# Run Regularization
# Note: output_path is set to experience_path to overwrite (synchronize) directly
python3 src/agents/regularizer.py \
    --regularizer_model "$REGULARIZER_MODEL" \
    --temperature $REGULARIZER_TEMPERATURE \
    --mode "$MODE" \
    --problem_embedding_path "$PROBLEM_EMBEDDING_FILE" \
    --experience_embedding_path "$EXP_EMBEDDING_FILE" \
    --experience_path "$EXPERIENCE_POOL" \
    --output_path "$EXPERIENC_REG_POOL" \
    --meta_path "$META_FILE" \
    --meta_output_path "$META_REG_FILE" \
    --total_limit $TOTAL_LIMIT \
    --subject_limit $SUBJECT_LIMIT \
    --exp_max_tokens $EXP_MAX_TOKENS \
    --project_name "explearn_reg" \
    --log_file "$LOG_FILE" \
    --debug


