import os
import argparse

# This script launches one training run per (dataset, seed) pair, all at once in the background, so that results can be compared across several random seeds.

# Directory that receives one log file per launched run.
LOG_DIR = "./train_record_Transformer_xvel"
# Dataset variants to sweep over for the chosen environment.
DATASETS = ("medium", "medium-expert", "medium-replay")
# Random seeds launched for every dataset.
SEEDS = range(0, 5)


def build_command(env, dataset, gpu_num, seed, log_dir=LOG_DIR):
    """Return the shell command that starts one background training run.

    Note: the combination of "--condition 'xvel' --distributions 'categorical'"
    is for CEDT; the combination of "--condition 'reward' --distributions
    'deterministic'" is for DT.

    Args:
        env: Value passed to ``train_CEDT.py --env``.
        dataset: Value passed to ``--dataset``.
        gpu_num: Value passed to ``--gpu``.
        seed: Value passed to ``--seed``.
        log_dir: Directory in which the run's log file is written.

    Returns:
        A command line that redirects stdout and stderr to
        ``<log_dir>/<env>_<dataset>_<seed>.log`` and ends with ``&`` so the
        shell runs it in the background.
    """
    # Values are interpolated unquoted; they are expected to be plain tokens
    # supplied by the operator, not untrusted input.
    log_path = f"{log_dir}/{env}_{dataset}_{seed}.log"
    return (
        f"python train_CEDT.py --env {env} --dataset {dataset} --gpu {gpu_num} --seed {seed} "
        "--dist_dim 30 --n_bins 31 --condition 'xvel'  --distributions 'categorical' "
        f"--save_model True > {log_path} 2>&1 &"
    )


def main():
    """Parse the command line and launch one run per (dataset, seed) pair."""
    parser = argparse.ArgumentParser()
    parser.add_argument('--env', default="halfcheetah", type=str)
    parser.add_argument('--gpu_num', default=0, type=int)
    args = parser.parse_args()

    # The output redirection in each command needs this directory to exist;
    # without it the shell cannot open the log file, the run never starts,
    # and the launcher simply carries on to the next command.
    os.makedirs(LOG_DIR, exist_ok=True)

    for dataset in DATASETS:
        for seed in SEEDS:
            cmd = build_command(args.env, dataset, args.gpu_num, seed)
            print(cmd)
            os.system(cmd)


if __name__ == "__main__":
    main()
