#!/bin/bash
# Local test script for GRU model - BLEU comparison
# Usage: ./run_gru_test_local.sh

set -e  # Exit on error

echo "========================================"
echo "BLEU Comparison Test - GRU (Local)"
echo "========================================"
echo "Start Time: $(date)"
echo ""

# ===== Environment Setup =====
# Set data directories (adjust paths as needed for your desktop)
export SCRATCH="${SCRATCH:-$(pwd)/data}"
export DATASET_PATH="${SCRATCH}/wmt_datasets"
export TOKENIZER_CACHE="${SCRATCH}/tokenizer_cache"
export CHECKPOINT_DIR="${SCRATCH}/checkpoints/test"
export WANDB_DIR="${SCRATCH}/wandb_logs"
export WANDB_CONFIG_DIR="${SCRATCH}/wandb_config"
export WANDB_CACHE_DIR="${SCRATCH}/wandb_cache"
export WANDB_PROJECT="bleu-comparison-test"

# CUDA/GPU configuration
export CUDA_VISIBLE_DEVICES=0
export MKL_THREADING_LAYER=GNU
export PYTHONUNBUFFERED=1
export PYTHONWARNINGS="ignore::UserWarning"
export MPLBACKEND=agg

# ===== Create necessary directories =====
echo "Creating directories..."
mkdir -p "${DATASET_PATH}"
mkdir -p "${TOKENIZER_CACHE}"
mkdir -p "${CHECKPOINT_DIR}"
mkdir -p "${WANDB_DIR}"
mkdir -p "${WANDB_CONFIG_DIR}"
mkdir -p logs/gru_local

echo "Environment configuration:"
echo "  SCRATCH: ${SCRATCH}"
echo "  DATASET_PATH: ${DATASET_PATH}"
echo "  TOKENIZER_CACHE: ${TOKENIZER_CACHE}"
echo "  CHECKPOINT_DIR: ${CHECKPOINT_DIR}"
echo "  WANDB_PROJECT: ${WANDB_PROJECT}"
echo ""

# ===== Configuration =====
# CONFIG="configs/wmt/unsynced_gru_new.json"
# CONFIG="configs/wmt/transformer_new.json"
# CONFIG="configs/wmt/unsynced_rnn_new.json"
CONFIG="configs/wmt/unsynced_recurrent_difflogic_new.json"
MODEL_NAME="unsynced_recurrent_difflogic"

# Verify config file exists
if [ ! -f "${CONFIG}" ]; then
    echo "ERROR: Config file not found: ${CONFIG}"
    echo "Please ensure you're running from the project root directory"
    exit 1
fi

echo "Model: ${MODEL_NAME}"
echo "Config: ${CONFIG}"
echo ""

# ===== Check Python environment =====
echo "Checking Python environment..."
python3 --version
echo ""

# Check if required packages are installed
echo "Checking required packages..."
python3 -c "import torch; print(f'PyTorch: {torch.__version__}')" || {
    echo "ERROR: PyTorch not found. Please install requirements:"
    echo "  pip install -r Singularity/requirements.txt"
    exit 1
}

python3 -c "import sacrebleu; print(f'sacreBLEU: {sacrebleu.__version__}')" || {
    echo "ERROR: sacreBLEU not found. Please install requirements."
    exit 1
}

python3 -c "import nltk; print(f'NLTK: {nltk.__version__}')" || {
    echo "ERROR: NLTK not found. Please install requirements."
    exit 1
}

echo ""

# ===== Run Training =====
echo "========================================"
echo "Starting Model Training..."
echo "========================================"
echo ""

# Save output to log file and display to console
LOG_FILE="logs/gru_local/run_$(date +%Y%m%d_%H%M%S).log"

python3 src/main.py --config "${CONFIG}" 2>&1 | tee "${LOG_FILE}"

EXIT_CODE=${PIPESTATUS[0]}

# ===== Job Summary =====
echo ""
echo "========================================"
echo "Training Complete"
echo "========================================"
echo "Model: ${MODEL_NAME}"
echo "Exit Code: ${EXIT_CODE}"
echo "End Time: $(date)"
echo "Log saved to: ${LOG_FILE}"
echo "========================================"
echo ""

# ===== Verify Checkpoint Creation =====
CHECKPOINT_PATH="${CHECKPOINT_DIR}/unsynced_gru_test.pt"
if [ -f "${CHECKPOINT_PATH}" ]; then
    echo "✓ Checkpoint saved successfully!"
    echo "  Location: ${CHECKPOINT_PATH}"
    echo "  Size: $(du -h ${CHECKPOINT_PATH} | cut -f1)"
else
    echo "✗ WARNING: Checkpoint not found at: ${CHECKPOINT_PATH}"
    echo "  Training may have failed. Check the log file above."
fi

echo ""
echo "========================================"
echo "Results"
echo "========================================"
echo "Check WandB project: ${WANDB_PROJECT}"
echo "Compare these metrics:"
echo "  - val/metric/bleu      (NLTK sentence-level)"
echo "  - val/metric/sacrebleu (corpus-level)"
echo ""
echo "Expected: Both BLEU metrics will show the impact"
echo "          of sentence-level vs corpus-level calculation"
echo "========================================"

exit ${EXIT_CODE}
