# Put the current directory at the front of the Python module search path and
# the implicit_q_learning directory at the end, keeping any existing entries
# in between.
export PYTHONPATH=".:${PYTHONPATH}:/home/zhengyao/project/transformer_planning/implicit_q_learning"

# Base experiment name; the per-round experiments below are named
# "<name>-<round>".
name="T-1"

# Datasets iterated by the training/planning loop (one entry per dataset).
datasets=(
  "hopper-medium-replay-v2"
)

# For each round (1..5, also passed to train.py as --seed) and each dataset:
#   1. run scripts/train.py,
#   2. run scripts/trainprior.py,
#   3. run scripts/plan.py with the beam_prior planner 20 times, passing the
#      run index as --suffix.
# All three steps share the experiment name "<name>-<round>".
for round in {1..5}; do
  for data in "${datasets[@]}"; do
    exp="${name}-${round}"

    # NOTE(review): planning presumably relies on what the two training
    # steps produce for this experiment name, so a failed training step skips
    # the remaining steps for this dataset/round instead of launching 20
    # planner runs that cannot succeed. Other rounds/datasets still run.
    if ! python scripts/train.py --dataset "$data" --exp_name "$exp" \
        --tag development --seed "$round"; then
      printf 'warning: train.py failed for %s (%s); skipping prior training and planning\n' \
        "$data" "$exp" >&2
      continue
    fi

    if ! python scripts/trainprior.py --dataset "$data" --exp_name "$exp"; then
      printf 'warning: trainprior.py failed for %s (%s); skipping planning\n' \
        "$data" "$exp" >&2
      continue
    fi

    for i in {1..20}; do
      python scripts/plan.py \
        --test_planner beam_prior \
        --dataset "$data" \
        --exp_name "$exp" \
        --suffix "$i" \
        --prob_threshold 0.001 \
        --prob_weight 5e2 \
        --rounds 1 \
        --nb_samples 128 \
        --beam_width 64 \
        --n_expand 4 \
        --horizon 15 \
        --iql_value False
    done
  done
done

# For each dataset, run plotting/read_results.py once per round experiment
# ("<name>-1" .. "<name>-5") and then once for the base experiment name.
#
# Iterates `datasets`: the previous loop variable `antdatasets` is not defined
# in this script, so it expanded to nothing and read_results.py was never run.
for data in "${datasets[@]}"; do
  for round in {1..5}; do
    python plotting/read_results.py --exp_name "${name}-${round}" --dataset "$data"
  done

  python plotting/read_results.py --exp_name "$name" --dataset "$data"
  #> ./$name-$data-beam-04.log
done


