#!/bin/bash
#PBS -N gmd_real_long_run_exp_002
#PBS -l select=1:ncpus=24:mpiprocs=1:mem=120gb
#PBS -P CSCI1368
#PBS -q smp
#PBS -l walltime=24:00:00
#PBS -m abe
#PBS -M xxx@gmail.com

# Set the proxy server details
export LLM_PROXY_HOST="chpclic1"
export LLM_PROXY_PORT="5000"
export LLM_PROXY_TIMEOUT="100"  # Add timeout setting

export OMP_NUM_THREADS=$PBS_NUM_PPN
export MKL_NUM_THREADS=$PBS_NUM_PPN
export OPENBLAS_NUM_THREADS=$PBS_NUM_PPN
export VECLIB_MAXIMUM_THREADS=$PBS_NUM_PPN
export NUMEXPR_NUM_THREADS=$PBS_NUM_PPN
export BLIS_NUM_THREADS=$PBS_NUM_PPN

ln -s $PWD $PBS_O_WORKDIR/$PBS_JOBID

cd $PBS_O_WORKDIR

echo "$PBS_O_WORKDIR/$PBS_JOBID"

module load chpc/python/anaconda/3-2021.11
source /apps/chpc/chem/anaconda3-2021.11/etc/profile.d/conda.sh
conda activate xxx

experiment=gmd_real_long_run_exp_002

# Create directories for output
mkdir -p /gmd/ipp/${experiment}
mkdir -p /gmd/logs/${experiment}

# Function to check if proxy server is available
check_proxy_server() {
    for i in {1..30}; do
        if curl -s http://${LLM_PROXY_HOST}:${LLM_PROXY_PORT}/health > /dev/null; then
            echo "Proxy server is available!"
            return 0
        fi
        echo "Waiting for proxy server... (attempt $i/30)"
        sleep 2
    done
    echo "Failed to connect to proxy server after 30 attempts"
    return 1
}

# Wait for proxy server to be available
echo "Checking proxy server availability..."
if ! check_proxy_server; then
    echo "Error: Proxy server is not available. Please ensure it's running on ${LLM_PROXY_HOST}"
    exit 1
fi

# Run the main script with error handling
echo "Starting generate_run_mcts..."
if ! python -u /gmd/generate_run_mcts.py 2>&1 | tee /gmd/run_${experiment}.log; then
    echo "Error: Test script failed. Check logs for details."
    exit 1
fi