#!/bin/bash
#SBATCH --job-name=vllm_clean_model_cards
#SBATCH --partition=boost_usr_prod      
      
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1       # 1 process per node
#SBATCH --cpus-per-task=16
#SBATCH --gres=gpu:2
#SBATCH --mem=128G                      
#SBATCH --time=24:00:00
#SBATCH -o vllm_%j.log
#SBATCH -e vllm_%j.err

# Job body: prints allocation info, prepares the software environment
# (modules + Python virtualenv) and runs clean_model_cards.py.
# Any failure while preparing the environment aborts the job immediately so
# the allocation is not spent running Python in a half-configured environment.

# Print an error message on stderr (captured by the job's -e file) and abort.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

echo "Starting job on $(date)"
echo "Node: $SLURM_JOB_NODELIST"
echo "CPUs per task: $SLURM_CPUS_PER_TASK"
echo "GPUs requested: $SLURM_GPUS_ON_NODE"

# Load the required modules (adapt to your system).
module purge
for required_module in gcc/12.2.0 cuda/12.4 python/3.11.7; do
  module load "$required_module" || die "cannot load module $required_module"
done

# Activate the project's virtual environment.
# NOTE(review): "prjects" in the paths below looks like a typo for "projects";
# confirm the directory really has this name before changing anything.
venv_activate="/leonardo/home/userexternal/ggramagl/prjects/CCO/.venv/bin/activate"
[[ -r "$venv_activate" ]] || die "virtualenv activate script not found: $venv_activate"
# shellcheck disable=SC1090 -- path is only known at run time
source "$venv_activate" || die "cannot activate virtualenv: $venv_activate"

# NOTE(review): presumably needed so that C code compiled at run time can find
# Python.h; verify that this directory exists on the compute nodes and matches
# the interpreter provided by the python/3.11.7 module.
export C_INCLUDE_PATH=/usr/include/python3.11
# GPU debug info
# nvidia-smi

# Run the Python script. The script path is relative, so it is resolved
# against the job's working directory.
exit_code=0
python clean_model_cards.py \
    --model_cards_path "/leonardo/home/userexternal/ggramagl/prjects/CCO/self-instruct/data/filtered_models_OLD.jsonl" \
    --output_path "/leonardo/home/userexternal/ggramagl/prjects/CCO/self-instruct/data/final_models_old.jsonl" \
    --model_path "/leonardo_scratch/fast/IscrC_ConFT/gerlandogramaglia/qwen3-32b" \
  || exit_code=$?

# Record when and how the job ended, then hand the Python exit status to Slurm.
echo "Job finished on $(date) with exit code $exit_code"
exit "$exit_code"