#for seed in 1 2 3 4 5
#do
#    CUDA_VISIBLE_DEVICES=0 OMP_NUM_THREADS=1 python main.py --model bebold --env MiniGrid-KeyCorridorS3R3-v0 --total_frames 10000000 --intrinsic_reward_coef 0.5 --entropy_cost 0.0005 --seed $seed &
#    CUDA_VISIBLE_DEVICES=1 OMP_NUM_THREADS=1 python main.py --model bebold --env MiniGrid-KeyCorridorS4R3-v0 --total_frames 10000000 --intrinsic_reward_coef 0.5 --entropy_cost 0.0005 --seed $seed &
#    wait
#    CUDA_VISIBLE_DEVICES=0 OMP_NUM_THREADS=1 python main.py --model bebold --env MiniGrid-KeyCorridorS5R3-v0 --total_frames 10000000 --intrinsic_reward_coef 0.5 --entropy_cost 0.0005 --seed $seed &
#    CUDA_VISIBLE_DEVICES=1 OMP_NUM_THREADS=1 python main.py --model bebold --env MiniGrid-KeyCorridorS6R3-v0 --total_frames 10000000 --intrinsic_reward_coef 0.5 --entropy_cost 0.0005 --seed $seed &
#    wait
#done

# Batch 1: start eight bebold runs in the background, each with its own
# CUDA_VISIBLE_DEVICES index (0-7) and OMP_NUM_THREADS=1.
#   MiniGrid-ObstructedMaze-1Q-v0    seeds 1-4 -> device indices 0-3
#   MiniGrid-ObstructedMaze-2Dlhb-v0 seeds 1-4 -> device indices 4-7
# The device index simply counts up across the (environment, seed) pairs.
gpu_id=0
for maze_env in MiniGrid-ObstructedMaze-1Q-v0 MiniGrid-ObstructedMaze-2Dlhb-v0; do
  for run_seed in 1 2 3 4; do
    CUDA_VISIBLE_DEVICES="$gpu_id" OMP_NUM_THREADS=1 python main.py \
      --model bebold \
      --env "$maze_env" \
      --total_frames 40000000 \
      --intrinsic_reward_coef 0.5 \
      --entropy_cost 0.0005 \
      --seed "$run_seed" &
    gpu_id=$((gpu_id + 1))
  done
done
# Barrier: block until every background job started so far has exited.
wait

# Batch 2: start eight bebold runs in the background, each with its own
# CUDA_VISIBLE_DEVICES index (0-7) and OMP_NUM_THREADS=1.
#   MiniGrid-ObstructedMaze-2Q-v0   seeds 1-4 -> device indices 0-3
#   MiniGrid-ObstructedMaze-Full-v0 seeds 1-4 -> device indices 4-7
# The device index simply counts up across the (environment, seed) pairs.
gpu_id=0
for maze_env in MiniGrid-ObstructedMaze-2Q-v0 MiniGrid-ObstructedMaze-Full-v0; do
  for run_seed in 1 2 3 4; do
    CUDA_VISIBLE_DEVICES="$gpu_id" OMP_NUM_THREADS=1 python main.py \
      --model bebold \
      --env "$maze_env" \
      --total_frames 40000000 \
      --intrinsic_reward_coef 0.5 \
      --entropy_cost 0.0005 \
      --seed "$run_seed" &
    gpu_id=$((gpu_id + 1))
  done
done
# Barrier: block until every background job started so far has exited.
wait