import os
import subprocess
import sys
          
# (environment name, eval.subsample_freq value) pairs covered by the sweep.
ENV_SUBSAMPLE_FREQS = (("cartpole", 20), ("acrobot", 20), ("lunarlander", 5))
# Values passed as eval.demos.
DEMO_COUNTS = (1, 2, 3, 5, 10)
# Values passed as seed.
SEEDS = range(10)
# method.type overrides handed to train.py, in launch order:
# pdoil -> SPOIL, iq -> IQ-Learn, logistic_offline -> PPIL.
TRAIN_METHOD_TYPES = ("pdoil", "iq", "logistic_offline")


def build_commands(env, freq, demos, seed):
    """Return the argv lists for one (env, demos, seed) configuration.

    Args:
        env: Value for the ``env=`` override.
        freq: Value for the ``eval.subsample_freq=`` override.
        demos: Value for the ``eval.demos=`` override.
        seed: Value for the ``seed=`` override.

    Returns:
        A list of four commands, each a list of argument strings: one
        ``train.py`` invocation per entry of ``TRAIN_METHOD_TYPES``
        followed by the ``run_bc.py`` (BC) invocation.
    """
    shared = [
        f"env={env}",
        f"eval.demos={demos}",
        f"eval.subsample_freq={freq}",
    ]
    commands = [
        [
            "python",
            "train.py",
            "agent=softq",
            *shared,
            "method.loss=value",
            f"seed={seed}",
            f"method.type={method_type}",
            "agent.init_temperature=1",
        ]
        for method_type in TRAIN_METHOD_TYPES
    ]
    # Run BC
    commands.append(["python", "run_bc.py", *shared, f"seed={seed}"])
    return commands


def main():
    """Run every command of the sweep sequentially.

    A run that exits with a non-zero status is reported on stderr and
    the sweep continues with the next command, so one failed run does
    not discard the remaining ones.

    Returns:
        0 if every command exited with status 0, otherwise 1.
    """
    failures = []
    for env, freq in ENV_SUBSAMPLE_FREQS:
        for demos in DEMO_COUNTS:
            for seed in SEEDS:
                for command in build_commands(env, freq, demos, seed):
                    # Argument list, no shell: nothing is re-parsed or
                    # expanded between this script and the child process.
                    returncode = subprocess.run(command, check=False).returncode
                    if returncode != 0:
                        failures.append((returncode, command))
                        print(
                            f"[exit {returncode}] {' '.join(command)}",
                            file=sys.stderr,
                        )
    if failures:
        print(f"{len(failures)} run(s) failed", file=sys.stderr)
        return 1
    return 0


if __name__ == "__main__":
    raise SystemExit(main())