#!/bin/bash
# Run bounded inspiration selector v2 in parallel across 8 GPUs
# Saves both selections and embeddings/similarities
#
# Requirements: torch 2.7+ environment (for specter2_base with safetensors)
#
# Usage: 
#   source activate_torch27.sh
#   bash run_selector_parallel_v2.sh

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_DIR="$(dirname $(dirname $SCRIPT_DIR))"

NUM_WORKERS=8

# ============ Input Directories ============
# MODIFY THESE: Set to your actual data directories
SFT_DIR="${SFT_QA_DATA_DIR:-<YOUR_SFT_QA_DATA_DIR>}"
REC_DIR="${BOUNDED_INSP_DIR:-<YOUR_BOUNDED_INSP_DIR>}/recommendations"

# ============ Output Directories ============
OUTPUT_DIR="${BOUNDED_INSP_DIR:-<YOUR_BOUNDED_INSP_DIR>}/selections"
EMBEDDINGS_DIR="${EMBEDDINGS_CACHE_DIR:-<YOUR_EMBEDDINGS_CACHE_DIR>}"

mkdir -p $OUTPUT_DIR
mkdir -p $EMBEDDINGS_DIR

# Get total file count
TOTAL_FILES=$(ls $REC_DIR/*.json 2>/dev/null | wc -l)
FILES_PER_WORKER=$((TOTAL_FILES / NUM_WORKERS + 1))

echo "=============================================="
echo "Bounded Inspiration Selector v2 - Parallel Run"
echo "=============================================="
echo "Total files: $TOTAL_FILES"
echo "Files per worker: ~$FILES_PER_WORKER"
echo "Output dir: $OUTPUT_DIR"
echo "Embeddings dir: $EMBEDDINGS_DIR"
echo ""

# Launch workers (environment already activated, just use python)
for i in $(seq 0 $((NUM_WORKERS - 1))); do
    CUDA_VISIBLE_DEVICES=$i python $SCRIPT_DIR/bounded_inspiration_selector_worker_v2.py \
        --sft_dir $SFT_DIR \
        --rec_dir $REC_DIR \
        --output_dir $OUTPUT_DIR \
        --embeddings_dir $EMBEDDINGS_DIR \
        --worker_id $i \
        --num_workers $NUM_WORKERS \
        > /tmp/selector_worker_v2_$i.log 2>&1 &
    echo "Launched worker $i on GPU $i (PID: $!)"
done

echo ""
echo "All workers launched."
echo ""
echo "Monitor progress:"
echo "  tail -f /tmp/selector_worker_v2_*.log"
echo ""
echo "Check output counts:"
echo "  watch -n 10 'ls $OUTPUT_DIR | wc -l'"
echo ""
echo "Waiting for all workers to complete..."
wait

echo ""
echo "=============================================="
echo "All workers completed!"
echo "=============================================="

# Count outputs
OUTPUT_COUNT=$(ls $OUTPUT_DIR/*.json 2>/dev/null | wc -l)
EMBED_COUNT=$(ls $EMBEDDINGS_DIR/*.json 2>/dev/null | wc -l)

echo "Outputs: $OUTPUT_COUNT files"
echo "Embeddings: $EMBED_COUNT files"
echo ""
echo "Run summary aggregation if needed."
