#!/bin/bash
#SBATCH -J steeringJob
#SBATCH -c 16
#SBATCH --mem=256G
#SBATCH -p h100
#SBATCH --gres=gpu:8
#SBATCH --tmp=50G
#SBATCH --mail-type=ALL

set -euo pipefail

CODE_ROOT="/workspace/"
EXP_ROOT="/workspace/data"  # root for all outputs
export PYTHONPATH="$CODE_ROOT${PYTHONPATH:+:$PYTHONPATH}"
export PYTORCH_CUDA_ALLOC_CONF="expandable_segments:True"

SEEDS=(4)
MODELS=(
  openai-community/gpt2
  google/gemma-3-1b-it
  Qwen/Qwen3-8B
)
CONCEPTS=(joy evil depression)
MODEL_GENERATING_CONCEPT="google/gemma-3-12b-it"
CONTEXTS_FILE="${CODE_ROOT}/contexts_modified.jsonl"         
EVAL_PARQUET="/workspace/fineweb_eval_parquet/sample/10BT/000_00000.parquet" 

mkdir -p "${EXP_ROOT}"

for SEED in "${SEEDS[@]}"; do
  RUN_DIR="${EXP_ROOT}/run_seed${SEED}"
  PROMPTS_DIR="${RUN_DIR}/prompts"
  STEERING_DIR="${RUN_DIR}/steering_vectors"
  PLOT_DIR="${RUN_DIR}/plot_data"
  MARGIN_DIR="${RUN_DIR}/margins"
  XENT_DIR="${RUN_DIR}/cross_entropy"
  MMLU_DIR="${RUN_DIR}/mmlu"
  BEHAVIOUR_DIR="${RUN_DIR}/behaviour_data"

  mkdir -p "${PROMPTS_DIR}" "${STEERING_DIR}" "${PLOT_DIR}" "${MARGIN_DIR}" "${XENT_DIR}" "${MMLU_DIR}"

  python3 "${CODE_ROOT}/generate_prompts.py" \
    --model_generating_concept "${MODEL_GENERATING_CONCEPT}" \
    --models "${MODELS[@]}" \
    --concepts "${CONCEPTS[@]}" \
    --out_dir "${PROMPTS_DIR}" \
    --seed "${SEED}"

  python3 "${CODE_ROOT}/generate_steering_vectors.py" \
    --models "${MODELS[@]}" \
    --in_dir "${PROMPTS_DIR}" \
    --save_dir "${STEERING_DIR}" \
    --seed "${SEED}"

  python3 "${CODE_ROOT}/generate_plot_data.py" \
    --models "${MODELS[@]}" \
    --steer_dir "${STEERING_DIR}" \
    --contexts_file "${CONTEXTS_FILE}" \
    --out_dir "${PLOT_DIR}" \
    --seed "${SEED}"
    --layers 3




done
