#!/usr/bin/env bash
# rolling_train_equities_lc.sh
# Sliding-window training for the LongConv baseline, 5 seeds per year.

# ─── Move to repo root ──────────────────────────────────────────────────────────
cd "$(dirname "$0")"/..

# Use BASE_PATH from environment or set default if not defined
BASE_PATH=${BASE_PATH:-"./"}
# Remove trailing slash if present
BASE_PATH=${BASE_PATH%/}

# ─── Tunables ───────────────────────────────────────────────────────────────────
N_SEEDS=5          # launch seeds 1…5 for every year
MAX_CONCURRENT=5   # allow up to 5 simultaneous Hydra jobs

# ─── Outer loop over rolling windows ────────────────────────────────────────────
for YEAR in {1990..2013}; do
  TRAIN_BEG=$(printf "%04d0101" "${YEAR}")
  TRAIN_END=$(printf "%04d1231" $((YEAR + 7)))
  VAL_BEG=$(printf  "%04d0101" $((YEAR + 8)))
  VAL_END=$(printf  "%04d1231" $((YEAR + 8)))
  TEST_BEG=$(printf "%04d0101" $((YEAR + 9)))
  TEST_END=$(printf "%04d1231" $((YEAR + 9)))
  VAL_YEAR=$(printf "%04d"     $((YEAR + 8)))

  echo "────────────────────────────────────────────────────────────"
  echo "YEAR ${YEAR}: Train ${TRAIN_BEG}–${TRAIN_END},   Val ${VAL_BEG}–${VAL_END},   Test ${TEST_BEG}–${TEST_END}"
  echo "────────────────────────────────────────────────────────────"

  # ─── Inner loop over seeds ────────────────────────────────────────────────────
  for SEED in $(seq 1 "$N_SEEDS"); do
    # throttle so we never exceed $MAX_CONCURRENT jobs
    while [ "$(jobs -p | wc -l)" -ge "$MAX_CONCURRENT" ]; do
      sleep 2
    done

    python -m train experiment=equities/equities_lc.yaml \
      dataset.dataset_config.train_beg_date="${TRAIN_BEG}" \
      dataset.dataset_config.train_end_date="${TRAIN_END}" \
      dataset.dataset_config.val_beg_date="${VAL_BEG}" \
      dataset.dataset_config.val_end_date="${VAL_END}" \
      dataset.dataset_config.test_beg_date="${TEST_BEG}" \
      dataset.dataset_config.test_end_date="${TEST_END}" \
      ++dataset.save_data=False \
      ++dataset.load_data=True \
      ++dataset.data_path="${BASE_PATH}/data/equities/equity_dataset_${VAL_YEAR}.npz" \
      ++train.seed="${SEED}" \
      wandb.name="${VAL_BEG}_lc_seed${SEED}" &

    # small pause to avoid Hydra timestamp clashes
    sleep 5
  done
done

# ─── Final rendez-vous ──────────────────────────────────────────────────────────
wait
echo "All sliding-window training jobs have completed."

# chmod +x rolling_train_equities_lc.sh
# ./rolling_train_equities_lc.sh