# train
# Launch one background training run for every (environment, seed, algorithm)
# combination below, each with --train_max_steps 1_000_000. stdout and stderr
# of each run are written to ./nohup_logs/<algo>-<env_id>-<seed>.log.
# All runs are started at once; this loop does not wait for them to finish.

# The output redirection fails (and the run never starts) if the log
# directory does not exist, so create it up front.
mkdir -p ./nohup_logs

for ENV_ID in button-press door-close drawer-close window-open faucet-open; do
    for SEED in 1024 1234 2986 314159 42; do
        # `for` word lists are whitespace-separated: a trailing comma would
        # become part of the value (e.g. "lm,") and end up in both the --our
        # argument and the log file name.
        for algo in lm ellm t2r oracle lm_pr lm_re lm_ns; do
            # nohup keeps the run alive if the launching shell hangs up.
            nohup python train_mw.py \
                --env_id "$ENV_ID" --seed "$SEED" --our "$algo" \
                --train_max_steps 1_000_000 \
                > "./nohup_logs/${algo}-${ENV_ID}-${SEED}.log" 2>&1 &
        done
    done
done

# Launch one background training run for every (environment, seed, algorithm)
# combination below, each with --train_max_steps 2_000_000. stdout and stderr
# of each run are written to ./nohup_logs/<algo>-<env_id>-<seed>.log.
# All runs are started at once; this loop does not wait for them to finish.

# The output redirection fails (and the run never starts) if the log
# directory does not exist, so create it up front.
mkdir -p ./nohup_logs

# `for` word lists are whitespace-separated: a trailing comma would become
# part of the value (e.g. "sweep-into," or "lm,") and end up in the
# --env_id / --our arguments and in the log file name.
for ENV_ID in sweep-into pick-place pick-out-of-hole sweep push; do
    for SEED in 1024 1234 2986 314159 42; do
        for algo in lm ellm t2r oracle lm_pr lm_re lm_ns; do
            # nohup keeps the run alive if the launching shell hangs up.
            nohup python train_mw.py \
                --env_id "$ENV_ID" --seed "$SEED" --our "$algo" \
                --train_max_steps 2_000_000 \
                > "./nohup_logs/${algo}-${ENV_ID}-${SEED}.log" 2>&1 &
        done
    done
done


# generalization evaluation
# Runs gene_mw.py in the foreground with no command-line arguments.
# NOTE(review): the training commands earlier in this script are launched in
# the background with `&` and nothing calls `wait`, so this command starts
# immediately rather than after training has finished — confirm that is the
# intended workflow (e.g. this line is meant to be run separately later).
python gene_mw.py
