#!/bin/bash
#SBATCH -p scavenger-gpu                       # Partition name
#SBATCH --gres=gpu:1                            # Number of GPUs per task
#SBATCH --cpus-per-task=2                      # Number of CPU cores per task
#SBATCH --mem=40G                              # Memory per task
#SBATCH --array=1-1                            # Number of tasks to launch
#SBATCH --job-name=train                         # Job name for the array


# Usage: sbatch <this script> <horizon>
#   <horizon> is forwarded to train.py as --max-episode-steps.
# Each array task selects one --lambda-pr value from the lprs list below via
# its 1-based SLURM_ARRAY_TASK_ID, so the --array range in the header should
# match the number of uncommented entries in lprs.

# Make the `conda` shell function available, then activate the environment.
# Abort if either step fails so training never starts in the wrong environment.
source /hpc/group/fanglab/mg585/miniconda3/etc/profile.d/conda.sh || exit 1
conda activate mujoco || exit 1

# Required first positional argument; exits with a usage message when missing
# or empty instead of passing a malformed command line to train.py.
horizon=${1:?usage: sbatch <this script> <horizon>}

# Candidate --lambda-pr values for the sweep. Uncomment entries to include
# them; entry k (1-based) is used by array task k.
lprs=(
    # 0.1
    # 0.5
    # 1
    5
    # 10
    # 20
    # 50
    # 100
)

# Map the 1-based array task id onto the 0-based lprs index. Defaults to the
# first entry when the script is run outside of a job array.
task_id=${SLURM_ARRAY_TASK_ID:-1}
lpr_index=$((task_id - 1))
if ((lpr_index < 0 || lpr_index >= ${#lprs[@]})); then
    printf 'error: array task id %s has no matching entry in lprs (%d available)\n' \
        "$task_id" "${#lprs[@]}" >&2
    exit 1
fi
lpr=${lprs[lpr_index]}

# Run the training script with the selected parameters. Only stdout is
# captured in the per-run log file; stderr is not redirected here.
srun python3 train.py --max-episode-steps "$horizon" --lambda-pr "$lpr" \
    > "h${horizon}_lpr${lpr}.log"