#!/usr/bin/env bash
set -euo pipefail

###############################################################################
# Usage Guide:
#
# Mode A: Fresh Start
#   - MODELS: Fill in original model name or path (e.g., "Qwen/Qwen2-VL-7B-Instruct")
#   - RESUME: "false"
#   - STAGE:  "stage1"
#
# Mode B: Resume Training
#   - MODELS: Keep consistent with initial training (e.g., "Qwen/Qwen3-VL-4B-Instruct"), do not change path
#   - RESUME: "true" (Script automatically finds the latest checkpoint in saves/ and continues)
#   - STAGE:  Keep consistent (e.g., "stage1")
#
# Mode C: Further Fine-tuning
#   - MODELS: Fill in the specific absolute path of the stage 1 checkpoint (e.g., ".../checkpoint-17100")
#   - RESUME: "false" (Because it starts a new round of training, not resuming)
#   - STAGE:  "stage2" (Modify this to create a new output folder, avoiding overwrite)
#   - HCOMBOS: Suggest lowering learning rate (e.g., 1e-6)
###############################################################################

##########################################
# =========== Train Modes ===============
# multi           = Multi-task mixed (Tradition)
# multi_gf        = Multi-task mixed (GF)
# multi_ugs       = Multi-task mixed (UGS)
# multi_gskel     = Multi-task mixed (GSkel)
# multi_gskel_full = Multi-task mixed (GSkel) + Event Graph Full
# multi_gskel_understand = Multi-task mixed (GSkel) - Understand (Graph Search + Mol Graph)
# multi_gskel_generation = Multi-task mixed (GSkel) - Generation (Scene Graph + Event Graph)
# gf_interleave_reasoning = Multi-task mixed (GF) + Interleave Reasoning
# gf_interleave_sample    = Multi-task mixed (GF) + Interleave Sample
# interleave      = Simultaneously launch both Interleave tasks above
# gskel_interleave_reasoning = Multi-task mixed (GSkel) + Interleave Reasoning
# gskel_interleave_sample    = Multi-task mixed (GSkel) + Interleave Sample
# interleave_gskel = Simultaneously launch both GSkel Interleave tasks above
# interleave_gskel_only_graph_search = Simultaneously launch both GSkel Interleave Only Graph Search tasks above
# interleave_gskel_variations = Simultaneously launch 3 variations: full, no_path_retrive, no_consistency
# interleave_v2           = Simultaneously launch 3 variations: algorithm, all, consistency
# multi_interleave_full   = Multi-task mixed (Tradition) + Interleave Full
# gh              = Simultaneously launch gh_reasoning and gh_simple
# gh_only_graph_search = Simultaneously launch gh_reasoning_only_graph_search and gh_simple_only_graph_search
# gh_reasoning    = Multi-task (GSkel) + Interleave Reasoning (GH)
# gh_simple       = Multi-task (GSkel) + Interleave Simple (GH)
# gh_v1           = Simultaneously launch gh_v1_desc_reason, gh_v1_desc, gh_v1_reason, gh_v1_irrelevant_desc_plus_reason
# gh_v1_desc_reason
# gh_v1_desc
# gh_v1_reason
# gh_v1_irrelevant_desc_plus_reason
# gh_v1_full      = Simultaneously launch gh_v1_desc_reason_full, gh_v1_desc_full, gh_v1_reason_full, gh_v1_irrelevant_desc_plus_reason_full
# gh_v1_desc_reason_full
# gh_v1_desc_full
# gh_v1_reason_full
# gh_v1_irrelevant_desc_plus_reason_full
# gh_tag          = Simultaneously launch simple_graph_tag, simple_think_tag, reasoning_graph_tag, reasoning_think_tag
# simple_graph_tag
# simple_think_tag
# reasoning_graph_tag
# reasoning_think_tag
# single          = Single task (Tradition)
# single_gf       = Single task (GF)
# single_gskel    = Single task (GSkel)
# multi_single    = One model launches N single tasks (Tradition)
# multi_single_gf = One model launches N single tasks (GF)
# multi_single_gskel = One model launches N single tasks (GSkel)

##########################################

TRAIN_MODE="multi_interleave_full"        
SINGLE_TASK="none"
STAGE="stage1" # Resume needs to point to original stage
TASK_LIST=("scene_graph" "graph_search" "mol_graph" "event_graph")

##########################################
# ======== Resume or Fresh ==============
##########################################
# Modify here: if resuming training, change to "true"
RESUME="false" 

SBATCH_FILE="fine_tune_multi_task.sbatch"

##########################################
# ========= Model Arrays =========
##########################################
MODELS=(
  # YOUR MODEL
)
TEMPLATES=(
  # MODEL TEMPLATE PATHS
)
DS_CONFIGS=(
  "examples/deepspeed/ds_z3_config.json"
  # "examples/deepspeed/ds_z3_config.json"
)
PARTITIONS=(

)
NGPUS=(

)

##########################################
# ========= W&B Project Automatic Switching =========
##########################################
if [[ "${TRAIN_MODE}" == "multi" ]]; then
    WANDB_PROJECT="GraphAGI_Multi"
elif [[ "${TRAIN_MODE}" == "multi_ugs" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_UGS"
elif [[ "${TRAIN_MODE}" == "multi_gf" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GF"
elif [[ "${TRAIN_MODE}" == "multi_gskel" ]] || [[ "${TRAIN_MODE}" == "multi_gskel_full" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel"
elif [[ "${TRAIN_MODE}" == "multi_gskel_understand" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel_Understand"
elif [[ "${TRAIN_MODE}" == "multi_gskel_generation" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel_Generation"
elif [[ "${TRAIN_MODE}" == "gf_interleave_reasoning" ]] || [[ "${TRAIN_MODE}" == "gf_interleave_sample" ]] || [[ "${TRAIN_MODE}" == "interleave" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GF_Interleave"
elif [[ "${TRAIN_MODE}" == "multi_interleave_full" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_Interleave"
elif [[ "${TRAIN_MODE}" == "gskel_interleave_reasoning" ]] || [[ "${TRAIN_MODE}" == "gskel_interleave_sample" ]] || [[ "${TRAIN_MODE}" == "interleave_gskel" ]] || [[ "${TRAIN_MODE}" == "interleave_gskel_only_graph_search" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel_Interleave"
elif [[ "${TRAIN_MODE}" == "multi_gskel_interleave_full" ]] || [[ "${TRAIN_MODE}" == "multi_gskel_interleave_no_path_retrive" ]] || [[ "${TRAIN_MODE}" == "multi_gskel_interleave_no_consistency" ]] || [[ "${TRAIN_MODE}" == "interleave_gskel_variations" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel_Interleave_Variations"
elif [[ "${TRAIN_MODE}" == "interleave_v2" ]] || [[ "${TRAIN_MODE}" == "interleave_v2_algorithm" ]] || [[ "${TRAIN_MODE}" == "interleave_v2_all" ]] || [[ "${TRAIN_MODE}" == "interleave_v2_consistency" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GSkel_Interleave_V2"
elif [[ "${TRAIN_MODE}" == "gh_reasoning" ]] || [[ "${TRAIN_MODE}" == "gh_simple" ]] || [[ "${TRAIN_MODE}" == "gh" ]] || [[ "${TRAIN_MODE}" == "gh_only_graph_search" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GH"
elif [[ "${TRAIN_MODE}" == "gh_v1" ]] || [[ "${TRAIN_MODE}" == "gh_v1_desc_reason" ]] || [[ "${TRAIN_MODE}" == "gh_v1_desc" ]] || [[ "${TRAIN_MODE}" == "gh_v1_reason" ]] || [[ "${TRAIN_MODE}" == "gh_v1_irrelevant_desc_plus_reason" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GH_v1"
elif [[ "${TRAIN_MODE}" == "gh_v1_full" ]] || [[ "${TRAIN_MODE}" == "gh_v1_desc_reason_full" ]] || [[ "${TRAIN_MODE}" == "gh_v1_desc_full" ]] || [[ "${TRAIN_MODE}" == "gh_v1_reason_full" ]] || [[ "${TRAIN_MODE}" == "gh_v1_irrelevant_desc_plus_reason_full" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GH_v1_Full"
elif [[ "${TRAIN_MODE}" == "gh_tag" ]] || [[ "${TRAIN_MODE}" == "simple_graph_tag" ]] || [[ "${TRAIN_MODE}" == "simple_think_tag" ]] || [[ "${TRAIN_MODE}" == "reasoning_graph_tag" ]] || [[ "${TRAIN_MODE}" == "reasoning_think_tag" ]]; then
    WANDB_PROJECT="GraphAGI_Multi_GH_Tag"
elif [[ "${TRAIN_MODE}" == "multi_single_gf" ]] || [[ "${TRAIN_MODE}" == "single_gf" ]]; then
    WANDB_PROJECT="GraphAGI_Single_GF"
elif [[ "${TRAIN_MODE}" == "multi_single_gskel" ]] || [[ "${TRAIN_MODE}" == "single_gskel" ]]; then
    WANDB_PROJECT="GraphAGI_Single_GSkel"
else
    WANDB_PROJECT="GraphAGI_Single"
fi


##########################################
# ========= Hyperparameter Sweep =========
##########################################
if [[ "${RESUME}" == "true" ]]; then
    # Resume: Must keep original parameters to match optimizer state
    HCOMBOS=("false 8e-6 4 0.10 cosine")
elif [[ "${STAGE}" == "stage2" ]]; then
    # Stage 2 fine-tuning: Suggest lowering learning rate
    HCOMBOS=("false 1e-6 2 0.05 cosine")
else
    # Fresh training (stage1)
    HCOMBOS=("false 8e-6 2 0.10 cosine")
fi


##########################################

n=${#MODELS[@]}

for ((i=0; i<n; i++)); do
  MODEL_NAME="${MODELS[i]}"
  TEMPLATE="${TEMPLATES[i]}"
  DS_CONFIG="${DS_CONFIGS[i]}"
  PARTITION="${PARTITIONS[i]}"
  NGPU="${NGPUS[i]}"
  SAN_MODEL="${MODEL_NAME##*/}"
  SM_LC="${SAN_MODEL,,}"   # Convert to lowercase

  if [[ "${SM_LC}" == *"2b"* ]]; then
      ACCUM_STEPS=32
  elif [[ "${SM_LC}" == *"4b"* ]]; then
      ACCUM_STEPS=8
  elif [[ "${SM_LC}" == *"7b"* ]]; then
      ACCUM_STEPS=16
  else
      ACCUM_STEPS=8
  fi

  for HC in "${HCOMBOS[@]}"; do
    set -- ${HC}
    VT="${1}"
    LR="${2}"
    EPOCH="${3}"
    WR="${4}"
    LR_TYPE="${5}"

    # Define common export list
    EXPORT_VARS="ALL,TRAIN_MODE=${TRAIN_MODE},SINGLE_TASK=${SINGLE_TASK},MODEL_NAME=${MODEL_NAME},TEMPLATE=${TEMPLATE},DS_CONFIG=${DS_CONFIG},PARTITION=${PARTITION},WANDB_ENTITY=${WANDB_ENTITY},WANDB_PROJECT=${WANDB_PROJECT},NGPU=${NGPU},VT=${VT},LR=${LR},EPOCH=${EPOCH},WR=${WR},LR_TYPE=${LR_TYPE},ACCUM_STEPS=${ACCUM_STEPS},RESUME=${RESUME},STAGE=${STAGE}"

    ######################################
    # ============ multi ================
    ######################################
    if [[ "${TRAIN_MODE}" == "multi" ]]; then
      JOB_NAME="multi_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ multi_gf =============
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gf" ]]; then
      JOB_NAME="multi_gf_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ multi_gskel ==========
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel" ]]; then
      JOB_NAME="multi_gskel_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ multi_gskel_full =====
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_full" ]]; then
      JOB_NAME="multi_gskel_full_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_gskel_understand =====
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_understand" ]]; then
      JOB_NAME="multi_gskel_und_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_gskel_generation =====
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_generation" ]]; then
      JOB_NAME="multi_gskel_gen_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= multi_ugs ===============
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_ugs" ]]; then
      JOB_NAME="multi_ugs_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= interleave ==============
    ######################################
    if [[ "${TRAIN_MODE}" == "interleave" ]]; then
      INTERLEAVE_MODES=("gf_interleave_reasoning" "gf_interleave_sample")
      for I_MODE in "${INTERLEAVE_MODES[@]}"; do
        if [[ "${I_MODE}" == "gf_interleave_reasoning" ]]; then
            SUFFIX="reasoning"
        else
            SUFFIX="sample"
        fi
        JOB_NAME="gf_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        # Override TRAIN_MODE
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${I_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ========= interleave_gskel ========
    ######################################
    if [[ "${TRAIN_MODE}" == "interleave_gskel" ]]; then
      INTERLEAVE_MODES=("gskel_interleave_reasoning" "gskel_interleave_sample")
      for I_MODE in "${INTERLEAVE_MODES[@]}"; do
        if [[ "${I_MODE}" == "gskel_interleave_reasoning" ]]; then
            SUFFIX="reasoning"
        else
            SUFFIX="sample"
        fi
        JOB_NAME="gskel_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        # Override TRAIN_MODE
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${I_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ========= interleave_gskel_only_graph_search ========
    ######################################
    if [[ "${TRAIN_MODE}" == "interleave_gskel_only_graph_search" ]]; then
      INTERLEAVE_MODES=("gskel_interleave_reasoning_only_graph_search" "gskel_interleave_sample_only_graph_search")
      for I_MODE in "${INTERLEAVE_MODES[@]}"; do
        if [[ "${I_MODE}" == "gskel_interleave_reasoning_only_graph_search" ]]; then
            SUFFIX="reasoning_only_gs"
        else
            SUFFIX="sample_only_gs"
        fi
        JOB_NAME="gskel_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        # Override TRAIN_MODE
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${I_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ========= interleave_gskel_variations ========
    ######################################
    if [[ "${TRAIN_MODE}" == "interleave_gskel_variations" ]]; then
      VAR_MODES=("multi_gskel_interleave_full" "multi_gskel_interleave_no_path_retrive" "multi_gskel_interleave_no_consistency")
      for V_MODE in "${VAR_MODES[@]}"; do
        if [[ "${V_MODE}" == "multi_gskel_interleave_full" ]]; then
            SUFFIX="full"
        elif [[ "${V_MODE}" == "multi_gskel_interleave_no_path_retrive" ]]; then
            SUFFIX="no_path"
        else
            SUFFIX="no_cons"
        fi
        JOB_NAME="gskel_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        # Override TRAIN_MODE
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${V_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ========= interleave_v2 ===========
    ######################################
    if [[ "${TRAIN_MODE}" == "interleave_v2" ]]; then
      V2_MODES=("interleave_v2_algorithm" "interleave_v2_all" "interleave_v2_consistency")
      for V_MODE in "${V2_MODES[@]}"; do
        if [[ "${V_MODE}" == "interleave_v2_algorithm" ]]; then
            SUFFIX="v2_algo"
        elif [[ "${V_MODE}" == "interleave_v2_all" ]]; then
            SUFFIX="v2_all"
        else
            SUFFIX="v2_cons"
        fi
        JOB_NAME="gskel_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${V_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ====== gf_interleave_reasoning ====
    ######################################
    if [[ "${TRAIN_MODE}" == "gf_interleave_reasoning" ]]; then
      JOB_NAME="gf_reasoning_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gf_interleave_sample =======
    ######################################
    if [[ "${TRAIN_MODE}" == "gf_interleave_sample" ]]; then
      JOB_NAME="gf_sample_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gskel_interleave_reasoning =
    ######################################
    if [[ "${TRAIN_MODE}" == "gskel_interleave_reasoning" ]]; then
      JOB_NAME="gskel_reasoning_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gskel_interleave_sample ====
    ######################################
    if [[ "${TRAIN_MODE}" == "gskel_interleave_sample" ]]; then
      JOB_NAME="gskel_sample_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gskel_interleave_reasoning_only_graph_search =
    ######################################
    if [[ "${TRAIN_MODE}" == "gskel_interleave_reasoning_only_graph_search" ]]; then
      JOB_NAME="gskel_reasoning_only_gs_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gskel_interleave_sample_only_graph_search ====
    ######################################
    if [[ "${TRAIN_MODE}" == "gskel_interleave_sample_only_graph_search" ]]; then
      JOB_NAME="gskel_sample_only_gs_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_gskel_interleave_full =
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_interleave_full" ]]; then
      JOB_NAME="gskel_full_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_gskel_interleave_no_path_retrive =
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_interleave_no_path_retrive" ]]; then
      JOB_NAME="gskel_no_path_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_gskel_interleave_no_consistency =
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_gskel_interleave_no_consistency" ]]; then
      JOB_NAME="gskel_no_cons_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== multi_interleave_full ======
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_interleave_full" ]]; then
      JOB_NAME="multi_il_full_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= gh ======================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh" ]]; then
      GH_MODES=("gh_reasoning" "gh_simple")
      for G_MODE in "${GH_MODES[@]}"; do
        if [[ "${G_MODE}" == "gh_reasoning" ]]; then
            SUFFIX="reasoning"
        else
            SUFFIX="simple"
        fi
        JOB_NAME="gh_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${G_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ========= gh_only_graph_search ======================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_only_graph_search" ]]; then
      GH_MODES=("gh_reasoning_only_graph_search" "gh_simple_only_graph_search")
      for G_MODE in "${GH_MODES[@]}"; do
        if [[ "${G_MODE}" == "gh_reasoning_only_graph_search" ]]; then
            SUFFIX="reasoning_only_gs"
        else
            SUFFIX="simple_only_gs"
        fi
        JOB_NAME="gh_${SUFFIX}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${G_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ====== gh_reasoning ===============
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_reasoning" ]]; then
      JOB_NAME="gh_reasoning_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gh_simple ==================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_simple" ]]; then
      JOB_NAME="gh_simple_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gh_reasoning_only_graph_search ===============
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_reasoning_only_graph_search" ]]; then
      JOB_NAME="gh_reasoning_only_gs_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== gh_simple_only_graph_search ==================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_simple_only_graph_search" ]]; then
      JOB_NAME="gh_simple_only_gs_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= gh_v1 ===================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_v1" ]]; then
      GH_V1_MODES=("gh_v1_desc_reason" "gh_v1_desc" "gh_v1_reason" "gh_v1_irrelevant_desc_plus_reason")
      for G_MODE in "${GH_V1_MODES[@]}"; do
        JOB_NAME="${G_MODE}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${G_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ====== gh_v1 individual modes =====
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_v1_desc_reason" ]]; then
      JOB_NAME="gh_v1_desc_reason_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_desc" ]]; then
      JOB_NAME="gh_v1_desc_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_reason" ]]; then
      JOB_NAME="gh_v1_reason_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_irrelevant_desc_plus_reason" ]]; then
      JOB_NAME="gh_v1_irrelevant_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= gh_v1_full ===================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_v1_full" ]]; then
      GH_V1_FULL_MODES=("gh_v1_desc_reason_full" "gh_v1_desc_full" "gh_v1_reason_full" "gh_v1_irrelevant_desc_plus_reason_full")
      for G_MODE in "${GH_V1_FULL_MODES[@]}"; do
        JOB_NAME="${G_MODE}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${G_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ====== gh_v1_full individual modes =====
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_v1_desc_reason_full" ]]; then
      JOB_NAME="gh_v1_dec_rea_ful_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_desc_full" ]]; then
      JOB_NAME="gh_v1_desc_ful_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_reason_full" ]]; then
      JOB_NAME="gh_v1_reason_ful_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    if [[ "${TRAIN_MODE}" == "gh_v1_irrelevant_desc_plus_reason_full" ]]; then
      JOB_NAME="gh_v1_irrel_ful_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= gh_tag ==================
    ######################################
    if [[ "${TRAIN_MODE}" == "gh_tag" ]]; then
      TAG_MODES=("simple_graph_tag" "simple_think_tag" "reasoning_graph_tag" "reasoning_think_tag")
      for T_MODE in "${TAG_MODES[@]}"; do
        JOB_NAME="${T_MODE}_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=${T_MODE},SINGLE_TASK=none" "${SBATCH_FILE}"
        sleep 2
      done
      continue
    fi

    ######################################
    # ====== simple_graph_tag ===========
    ######################################
    if [[ "${TRAIN_MODE}" == "simple_graph_tag" ]]; then
      JOB_NAME="simple_graph_tag_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== simple_think_tag ===========
    ######################################
    if [[ "${TRAIN_MODE}" == "simple_think_tag" ]]; then
      JOB_NAME="simple_think_tag_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== reasoning_graph_tag ========
    ######################################
    if [[ "${TRAIN_MODE}" == "reasoning_graph_tag" ]]; then
      JOB_NAME="reasoning_graph_tag_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ====== reasoning_think_tag ========
    ######################################
    if [[ "${TRAIN_MODE}" == "reasoning_think_tag" ]]; then
      JOB_NAME="reasoning_think_tag_${SAN_MODEL}_vt${VT}_lr${LR}_ep${EPOCH}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=none" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ single ===============
    ######################################
    if [[ "${TRAIN_MODE}" == "single" ]]; then
      JOB_NAME="single_${SINGLE_TASK}_${SAN_MODEL}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=${SINGLE_TASK}" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ single_gf ============
    ######################################
    if [[ "${TRAIN_MODE}" == "single_gf" ]]; then
      JOB_NAME="single_gf_${SINGLE_TASK}_${SAN_MODEL}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=${SINGLE_TASK}" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ============ single_gskel =========
    ######################################
    if [[ "${TRAIN_MODE}" == "single_gskel" ]]; then
      JOB_NAME="single_gskel_${SINGLE_TASK}_${SAN_MODEL}"
      sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},SINGLE_TASK=${SINGLE_TASK}" "${SBATCH_FILE}"
      sleep 2
      continue
    fi

    ######################################
    # ========= multi_single ============
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_single" ]]; then
      for TASK in "${TASK_LIST[@]}"; do
        JOB_NAME="single_${TASK}_${SAN_MODEL}"
        # Note: here we need to override SINGLE_TASK
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=single,SINGLE_TASK=${TASK}" "${SBATCH_FILE}"
        sleep 2
      done
    fi

    ######################################
    # ======= multi_single_gf ===========
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_single_gf" ]]; then
      for TASK in "${TASK_LIST[@]}"; do
        JOB_NAME="single_gf_${TASK}_${SAN_MODEL}"
        # Override TRAIN_MODE to single_gf
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=single_gf,SINGLE_TASK=${TASK}" "${SBATCH_FILE}"
        sleep 2
      done
    fi

    ######################################
    # ======= multi_single_gskel ========
    ######################################
    if [[ "${TRAIN_MODE}" == "multi_single_gskel" ]]; then
      # Launch fine-tuning job for each single task in the task list
      # Stage 1 job name is usually short (contains only original model name)
      # Stage 2 job name is longer (contains full Checkpoint folder name)
      for TASK in "${TASK_LIST[@]}"; do
        JOB_NAME="single_gskel_${TASK}_${SAN_MODEL}"
        # Override TRAIN_MODE to single_gskel
        sbatch -J "${JOB_NAME}" -p "${PARTITION}" --gres=gpu:${NGPU} --time="${TIME_LIMIT}" --export="${EXPORT_VARS},TRAIN_MODE=single_gskel,SINGLE_TASK=${TASK}" "${SBATCH_FILE}"
        sleep 2
      done
    fi

  done
done