import os
# Launcher script: runs ours_main.py once per (task, train_num) combination.
#
# NOTE: every os.system() call executes in its own short-lived subshell, so a
# standalone `conda activate py3` cannot influence the commands issued after
# it. Each run is therefore started through `conda run -n <env>`, which
# executes the command inside the named environment.
CONDA_ENV = 'py3'

# Tasks to train and the matching --ep_max value (paired by position).
# task_list =  ['Maze_square_random', 'Maze_U_shape','Maze_S_shape','Maze_spiral_shape']
# task_max_ep_list = [8000,6000,4000,2000]
task_list = ['Maze_U_shape',]
task_max_ep_list = [6000,]


def build_command(task, ep_max, train_num, dense=True):
    """Return the shell command line for a single ours_main.py run.

    Args:
        task: value passed to ``--env``.
        ep_max: value passed to ``--ep_max``.
        train_num: value passed to ``--train_num``.
        dense: when true, append the ``--dense`` flag.

    Returns:
        The full command string, wrapped in ``conda run`` so that it executes
        inside ``CONDA_ENV``.
    """
    # --no-capture-output keeps the child's stdout/stderr streaming to the
    # terminal instead of being buffered by conda until the run finishes.
    command = (
        'conda run -n {} --no-capture-output '
        'python ours_main.py --env {} --ep_max {} --train_num {}'
    ).format(CONDA_ENV, task, ep_max, train_num)
    if dense:
        command += ' --dense'
    return command


for task, ep_max in zip(task_list, task_max_ep_list):
    # A commented-out earlier variant ran without --dense using train_num 3..5:
    # for j in range(3):
    #     os.system('python ours_main.py --env {} --ep_max {} --train_num {}'.format(task,ep_max,j+3))

    # Dense runs use train_num 6, 7 and 8.
    for train_num in range(6, 9):
        status = os.system(build_command(task, ep_max, train_num))
        if status != 0:
            # Best effort: report the failure but keep going with the
            # remaining runs, as the original script did.
            print('run failed (status {}): env={} train_num={}'.format(
                status, task, train_num))

# for j in range(6):
#     os.system('python ours_main.py --env {} --ep_max {} --train_num {}'.format('Maze_S_shape',4000,j))