#!/bin/bash"
# env_name="MiniGrid-Reacher"
# env_name="MiniGrid-Reacher-extra-good"
# env_name="MiniGrid-Reacher-noisy"
# env_name="MDPtakeball"
env_name="MiniGrid-Reacher-MDP"
# env_name="hopper"
# env_name="ant"
# env_name="walker2d"

# dataset="expert"
# dataset="medium-expert"
# dataset="medium-replay"
# dataset="full-replay"
# dataset="medium"
# dataset="random"
codebook=-1
seeds=(0)
k_values=(8)
codebook=16
rule_based_dataset_files=(
    "datasets/rule_based/MiniGrid-Reacher-MDP/balanced_20000.pkl"
    "datasets/rule_based/MiniGrid-Reacher-MDP/rightfirst_20000.pkl"
    "datasets/rule_based/MiniGrid-Reacher-MDP/downfirst_20000.pkl"
    "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag1_20000.pkl"
    "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag2_20000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/balanced_8000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/rightfirst_8000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/downfirst_8000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag1_8000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag2_8000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/balanced_2000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/rightfirst_2000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/downfirst_2000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag1_2000.pkl"
    # "datasets/rule_based/MiniGrid-Reacher-MDP/zigzag2_2000.pkl"
    # "datasets/rule_based/MDPtakeball/fixed_0_20000.pkl"
    # "datasets/rule_based/MDPtakeball/fixed_1_20000.pkl"
    # "datasets/rule_based/MDPtakeball/fixed_2_20000.pkl"
    # "datasets/rule_based/MDPtakeball/fixed_3_20000.pkl"
)

mkdir logs

# set -x
SELECTED_GPU=$(python scripts/select_gpu.py)
echo "Selected GPU: $SELECTED_GPU"
for seed in "${seeds[@]}"; do
    for k in "${k_values[@]}"; do
        echo "Running VAE + Kmeans with k=$k, seed=$seed"
        # CUDA_VISIBLE_DEVICES=$SELECTED_GPU python algos/VAE_kmeans_all.py >logs/$seed-$k-out.txt 2>logs/$seed-$k-err.txt \
        CUDA_VISIBLE_DEVICES=$SELECTED_GPU python algos/VAE_kmeans.py \
            --env "$env_name" \
            --seed "$seed" \
            --project "0128VAE_${env_name}" \
            --max_updates 400 \
            --rule_based_dataset_files "${rule_based_dataset_files[@]}"\
            --learning_rate 2e-4\
            --vqvae_alpha 100\
            --k "$k"\
            --vqvae_codebook "$codebook"\
            --algo "vqvae"\
            # --algo "vqvae_gumble_softmax" --batch_size 1024\
            # --true_k_available False\

    done
done
# echo "Done"
# python scripts/make_sheet.py ${#seeds[@]} ${#k_values[@]} ${seeds[@]} ${k_values[@]}