#!/bin/bash
#SBATCH --job-name=Robust_RL
#SBATCH --output=res_TQC_VAR_print2.txt
#SBATCH --error=error_cont_print2
#
#
##SBATCH --ntasks=80
#SBATCH --time=20:00:00
#SBATCH --partition=cpu_shared
#SBATCH --nodes=1



# Fan out the Acrobot-v1 'std_penal' experiments as independent SLURM jobs.
#
# Every child script is submitted with --ntasks=16 and receives five
# positional arguments, in this order:
#   150_000  <algorithm>  'Acrobot-v1'  'std_penal'  <run tag>
# NOTE(review): what the child scripts do with these arguments is not visible
# from this file (presumably step budget, algorithm, environment, penalty
# mode, and output tag) -- confirm against QRDQN_*_acro.sh.
#
# Submissions run concurrently in the background. Their PIDs are collected
# so each one can be waited on individually: a bare `wait` always returns 0
# and would hide a rejected submission.
submit_pids=()

# QRDQN runs 1..6: script name and run tag are derived from the same index
# so they cannot drift apart.
for run in 1 2 3 4 5 6; do
  sbatch --ntasks=16 "QRDQN_${run}_acro.sh" 150_000 'QRDQN' 'Acrobot-v1' \
    'std_penal' "replay5_QRDQN_acro_${run}_std" &
  submit_pids+=("$!")
done

# Disabled submission, kept for reference.
##sbatch --ntasks=16  SAC_cont.sh &

# Single PPO run for the same environment and penalty setting.
sbatch --ntasks=16 PPO_discrete_acro.sh 150_000 'PPO' 'Acrobot-v1' \
  'std_penal' 'replay5_PPO_acro_std' &
submit_pids+=("$!")

# Barrier: reap every submission and count the ones that failed. All
# submissions are attempted regardless; only the final status changes.
failed_submissions=0
for pid in "${submit_pids[@]}"; do
  wait "$pid" || failed_submissions=$((failed_submissions + 1))
done

if ((failed_submissions > 0)); then
  printf 'error: %d of %d sbatch submissions failed\n' \
    "$failed_submissions" "${#submit_pids[@]}" >&2
  exit 1
fi
##


