# Experiment launcher. Each section runs toy_*.py scripts over a sweep of
# seeds (--seed) and coefficients (--c) for a fixed --gamma. The stdout of
# every run is written to logs/<log_name>; stderr is not redirected.

# Every run redirects into logs/, so stop immediately if it cannot be created
# instead of launching a whole sweep whose redirects would all fail.
mkdir -p "logs" || exit 1

# Tag embedded in the sfdqn log file names (choose one).
suff=gpi
# suff=wo_gpi
# suff=zero

# Manual single-run settings, e.g. for the one-off commented-out commands
# near the end of this file that read $wcoeff / $seed / $gamma directly.
# wcoeff=20 #0.01
# seed=6
# gamma=0.9

# Figure 2 ------------------------------------------------------------------------------------------
gamma=0.0
SEED_SET="0 1 2 3 4 5 6 7 8 9"
WCOEFF_SET="0.001"
# SEED_SET and WCOEFF_SET are space-separated lists, so they are expanded
# unquoted on purpose (word splitting yields one item per iteration).
# Every other expansion is quoted so a value can never split an argument or
# make a redirect target ambiguous.
for seed in $SEED_SET; do
    for wcoeff in $WCOEFF_SET; do
        # toy_sfdqn_new.py run; its log name carries the sfdqn_<suff> tag.
        log_name="phi_learn_${wcoeff}-${seed}-${gamma}-sfdqn_${suff}-rebuttal-sfdqn-dqn-comp-eps-0.out"
        python -u toy_sfdqn_new.py --seed "$seed" --c "$wcoeff" --gamma "$gamma" > "logs/${log_name}"

        # toy_dqn_gpi.py run with the same seed / coefficient / gamma.
        log_name="phi_learn_${wcoeff}-${seed}-${gamma}-dqn_gpi-rebuttal-sfdqn-dqn-comp-eps-0.out"
        python -u toy_dqn_gpi.py --seed "$seed" --c "$wcoeff" --gamma "$gamma" > "logs/${log_name}"
    done
done

# To generate the DQN log for task 1:
# seed=0
# wcoeff=0.0
# log_name=phi_learn_$wcoeff-$seed-$gamma-dqn-task1.out
# python -u toy_dqn.py --seed $seed --c $wcoeff --gamma $gamma  > logs/$log_name
#---------------------------------------------------------------------------------------------------


# Figure 4 ------------------------------------------------------------------------------------------
# SEED_SET="0 1 2 3 4 5 6 7 8 9"
# WCOEFF_SET="20 40 60 80"
# for seed in $SEED_SET; do
#     for wcoeff in $WCOEFF_SET; do
#         log_name=phi_learn_$wcoeff-$seed-$gamma-sfdqn_$suff-rebuttal-wstar-gap.out
#         python -u toy_sfdqn_new.py --seed $seed --c $wcoeff --gamma $gamma > logs/$log_name
#     done
# done

# SEED_SET="0"
# WCOEFF_SET="2.0 4.0 6.0 8.0"
# for seed in $SEED_SET; do
#     for wcoeff in $WCOEFF_SET; do
#         log_name=phi_learn_$wcoeff-$seed-$gamma-dqn-wstar-gapt.out
#         python -u toy_dqn.py --seed $seed --c $wcoeff --gamma $gamma  > logs/$log_name
#     done
# done
#-------------------------------------------------------------------------------------------------------


# Table 1 ------------------------------------------------------------------------------------------
# gamma=0.9
# SEED_SET="1 2 3 4 5 6 7 8 9"
# WCOEFF_SET="0.01 0.1 1 10" #0.01 0.1 1 10
# for seed in $SEED_SET; do
#     for wcoeff in $WCOEFF_SET; do
#         log_name=phi_learn_$wcoeff-$seed-$gamma-sfdqn_$suff-rebuttal-wstar-gpi-gap-eps-0.out
#         python -u toy_sfdqn_new.py --seed $seed --c $wcoeff --gamma $gamma > logs/$log_name
#         log_name=phi_learn_$wcoeff-$seed-$gamma-sfdqn_$suff-rebuttal-wstar-no-gpi-gap-eps-0.out
#         python -u toy_sfdqn_new_no_gpi.py --seed $seed --c $wcoeff --gamma $gamma > logs/$log_name
#     done
# done

# SEED_SET="0"
# WCOEFF_SET="0.01 0.1"
# for seed in $SEED_SET; do
#     for wcoeff in $WCOEFF_SET; do
#         log_name=phi_learn_$wcoeff-$seed-$gamma-dqn-wstar-gapt-eps-0.out
#         python -u toy_dqn.py --seed $seed --c $wcoeff --gamma $gamma  > logs/$log_name
#     done
# done
#-------------------------------------------------------------------------------------------------------

# log_name=phi_learn_$wcoeff-$seed-$gamma-dqn-w_init_opt.out
# python -u toy_dqn.py --seed $seed --c $wcoeff --gamma $gamma  > logs/$log_name

# log_name=q_bound_$wcoeff-$seed-$suff.out
# python -u toy_sfdqn_q_bound.py --seed $seed --c $wcoeff > logs/$log_name


# Figure 1
# SEED_SET="0 1 2 3 4 5 6 7 8 9"
# WCOEFF_SET="20 40 60 80"

# for seed in $SEED_SET; do
#     for wcoeff in $WCOEFF_SET; do
#         log_name=theta_bound_$wcoeff-$seed-$gamma-winit-gap.out
#         python -u toy_sfdqn_theta_bound.py --seed $seed --c $wcoeff --gamma $gamma > logs/$log_name
#     done
# done

