#!/bin/bash
#SBATCH --job-name=rule_all_i4_v6
#SBATCH --chdir=/home/users/XXXX/task-sequencing/train/rule_03_full/rule_all_i4_v6/source
#SBATCH --output=/home/users/XXXX/task-sequencing/train/rule_03_full/rule_all_i4_v6/job/%j_%a.o
#SBATCH --error=/home/users/XXXX/task-sequencing/train/rule_03_full/rule_all_i4_v6/job/%j_%a.e
#SBATCH --parsable
#SBATCH --exclude=gpu008
#SBATCH --time=4:00:00
#SBATCH --partition=shared-gpu
#SBATCH --gres=gpu:1,VramPerGpu:16G


# ---------------------------------------------------------------------------
# Job body: set up the software environment, launch the training run, record
# a scheduler accounting snapshot, and exit with the training run's status.
#
# The paths below must stay in sync with the --chdir/--output/--error
# #SBATCH directives at the top of this file (directives cannot use shell
# variables, so the values are necessarily repeated there).
# ---------------------------------------------------------------------------
base_dir=/home/users/XXXX/task-sequencing/train/rule_03_full
run_name=rule_all_i4_v6
job_dir="${base_dir}/${run_name}/job"

# Print the job id first so the log file can be matched to scheduler records.
echo "JOB ID IS ${SLURM_JOB_ID}"

# Software environment. The order is kept exactly as before: the conda
# environment is activated first, then the toolchain/PyTorch modules are loaded.
module load Anaconda3
source activate pytorch
#module load GCC/11.3.0 OpenMPI/4.1.4 PyTorch/1.12.0-CUDA-11.7.0 
module load GCC/12.3.0 OpenMPI/4.1.5 PyTorch/2.1.2-CUDA-12.1.1 tensorboard/2.15.1

# Arguments for run.py, one per line so individual settings are easy to diff.
# Order is preserved from the original single-line invocation.
train_args=(
  --base-dir="${base_dir}"
  --run-dir="${run_name}"
  --data-dir=/home/users/XXXX/task-sequencing/data_all
  --train-epochs=20000
  --batch-size=2048
  --n-contexts=3
  --model=0
  --seed=4
  --n-blocks=6
  --rank=0
  --hidden=32
  --task-train 0.9
  --weight-init 0.01
  --lr 3e-4
  --sigma-init 0.0
  --n-particles 250
  --n-steps 15
  --grad-clip 1.0
  # NOTE(review): --batch-size is passed twice (2048 above, 512 here). Which
  # one takes effect depends on run.py's argument parser (presumably the last
  # one wins -- confirm) and the unused occurrence should be removed.
  --batch-size 512
)

# Capture the exit code instead of letting it be overwritten by later
# commands: the batch script's exit status is what SLURM records for the job,
# and previously it was always sacct's status, hiding training failures.
# -u keeps Python's stdout/stderr unbuffered so the log files update live.
train_status=0
python -u run.py "${train_args[@]}" || train_status=$?

# Accounting snapshot for this job. It is taken even when training failed so
# node/timing information is still available for debugging. A failure of
# sacct itself is reported but does not change the job's result.
sacct -j "${SLURM_JOB_ID}" --format=JobID,Start,Elapsed,NCPUS,NodeList,NTasks > "${job_dir}/node.txt" \
  || echo "warning: sacct failed; ${job_dir}/node.txt may be empty or incomplete" >&2

# Propagate the training run's exit code as the job's exit code.
exit "${train_status}"


