#!/bin/bash
set -euo pipefail
. experiments/include.bash
. src/recognizers/functions.bash

# Check for required arguments
if [ "$#" -lt 1 ]; then
  echo "Usage: $0 <sweep_id> [--count NUM_AGENTS] [--validation-data SET] [--trial-no TRIAL] [--num-languages NUM]"
  echo
  echo "Options:"
  echo "  <sweep_id>              The W&B sweep ID (e.g., ymntf9hj)"
  echo "  --count NUM_AGENTS      Number of agents to start (default: 10)"
  echo "  --validation-data SET   Validation dataset (default: validation-short)"
  echo "  --num-languages NUM     Number of languages to sample for each run (default: 5)"
  exit 1
fi

SWEEP_ID=$1
shift

# Default values
COUNT=10
VALIDATION_DATA="validation-short"
NUM_LANGUAGES=5

# Parse additional arguments
while [[ $# -gt 0 ]]; do
  case "$1" in
    --count)
      COUNT="$2"
      shift 2
      ;;
    --validation-data)
      VALIDATION_DATA="$2"
      shift 2
      ;;
    --num-languages)
      NUM_LANGUAGES="$2"
      shift 2
      ;;
    *)
      echo "Unknown option: $1"
      exit 1
      ;;
  esac
done

# Construct full sweep ID
SWEEP_ID_FULL="$WANDB_ENTITY/nn-ch-hyperparam-search/$SWEEP_ID"

# Ensure CSV file exists
LANGUAGES_CSV="$BASE_DIR/languages/random/random_languages.csv"
if [ ! -f "$LANGUAGES_CSV" ]; then
  echo "Error: Languages CSV file not found at $LANGUAGES_CSV"
  exit 1
fi

# Count number of languages in the CSV
NUM_TOTAL_LANGUAGES=$(tail -n +2 "$LANGUAGES_CSV" | wc -l | xargs)
echo "Found $NUM_TOTAL_LANGUAGES random languages in $LANGUAGES_CSV"

echo "Starting $COUNT agents for sweep $SWEEP_ID..."

# Create scripts directory if it doesn't exist
SCRIPTS_DIR="$(pwd)/experiments/training/sweep_scripts"
mkdir -p "$SCRIPTS_DIR"

# Launch sweep agents
for i in $(seq 1 $COUNT); do
  echo "Launching agent $i of $COUNT"
  
  # Create agent script in a location accessible from compute nodes
  AGENT_SCRIPT="${SCRIPTS_DIR}/agent_${SWEEP_ID}_${i}.sh"
  
  # Write the script content
  cat > "$AGENT_SCRIPT" << EOF
#!/bin/bash
cd "$(pwd)"
export WANDB_ENTITY="$WANDB_ENTITY"
export WANDB_PROJECT=nn-ch-hyperparam-search
export LANGUAGES_FILE="$LANGUAGES_CSV"
export VALIDATION_DATA="$VALIDATION_DATA"
export NUM_LANGUAGES="$NUM_LANGUAGES"
export BASE_DIR="$BASE_DIR"

# Print some debug info
echo "======= AGENT $i DEBUG INFO =======" >&2
echo "Running wandb agent for sweep $SWEEP_ID_FULL" >&2
echo "AGENT_ID: \$AGENT_ID" >&2
echo "WANDB_ENTITY: \$WANDB_ENTITY" >&2
echo "WANDB_PROJECT: \$WANDB_PROJECT" >&2
echo "LANGUAGES_FILE: \$LANGUAGES_FILE" >&2
echo "VALIDATION_DATA: \$VALIDATION_DATA" >&2
echo "NUM_LANGUAGES: \$NUM_LANGUAGES" >&2
echo "BASE_DIR: \$BASE_DIR" >&2
echo "Current directory: \$(pwd)" >&2
echo "=================================" >&2

# Run the agent with command-line arguments
wandb agent $SWEEP_ID_FULL
EOF
  export AGENT_ID="$i"
  chmod +x "$AGENT_SCRIPT"
  
  JOB_NAME="sweep_${SWEEP_ID}_agent$i"
  
  # Submit job
  submit_job \
    "$JOB_NAME" \
    cpu \
    --mem-per-cpu=8G \
    --time=24:00:00 \
    -- "$AGENT_SCRIPT"
    
  echo "Submitted job $JOB_NAME with script $AGENT_SCRIPT"
done

echo "All $COUNT agents launched for sweep $SWEEP_ID"
echo "Monitor progress at: https://wandb.ai/$WANDB_ENTITY/nn-ch-hyperparam-search/sweeps/$SWEEP_ID"
echo "-----------------------------------------------------"
echo "Agent scripts are in $SCRIPTS_DIR"
