# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/large/gray_decode/gray_decode_gpt2_digits=100_bs=128 \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/large/gray_decode/gray_decode_n=100/data.test \
#     --visualize_attention

## ReLU
# run_relu_eval MODEL_PATH DATASET_PATH
#   Invokes src/evaluation_gpt.py for checkpoint 7820 of the model stored at
#   MODEL_PATH, using DATASET_PATH as the dataset, with --visualize_attention.
#   The function's status is the status of the python3 process.
run_relu_eval() {
    python3 src/evaluation_gpt.py \
        --model_path "$1" \
        --checkpoint_id 7820 \
        --dataset_path "$2" \
        --visualize_attention
}

# "oneperm" model, evaluated on the data-one test file.
run_relu_eval \
    '/mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128_oneperm' \
    '/mnt/nfs/data/small/relu/n=20/data-one.test'

# "randperm" model, evaluated on the data-rand test file.
# Runs regardless of whether the previous evaluation succeeded.
run_relu_eval \
    '/mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128_randperm' \
    '/mnt/nfs/data/small/relu/n=20/data-rand.test'

# ## ReLU
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=50_bs=128 \
#     --checkpoint_id 7820 \
#     --dataset_path /mnt/nfs/data/small/relu/n=50/data.test \
#     --visualize_attention \
#     --target_input_text "5 6 -9 8 7 6 6 9 9 8 -4 5 1 6 7 -3 -6 -3 -2 4 1 0 4 0 1 4 8 7 7 5 5 -8 7 -1 2 9 5 -4 9 9 -1 5 2 0 -7 9 3 4 8 4"

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=50_bs=128_inverse \
#     --checkpoint_id 7820 \
#     --dataset_path /mnt/nfs/data/small/relu/n=50/data-inv.test \
#     --visualize_attention

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128 \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/relu/n=20/data.test \
#     --visualize_attention 

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128_inverse \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/relu/n=20/data-inv.test \
#     --visualize_attention 


## Square
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square/square_gpt2_digits=50_bs=128 \
#     --checkpoint_id 782 \
#     --dataset_path /mnt/nfs/data/small/square/n=50/data.test \
#     --visualize_attention


# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square/square_gpt2_digits=50_bs=128_inverse \
#     --checkpoint_id 782 \
#     --dataset_path /mnt/nfs/data/small/square/n=50/data-inv.test \
#     --visualize_attention

# ## Square mod 10
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod10/square_gpt2_mod10_digits=50_bs=128 \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/square_mod10/n=50/data.test \
#     --visualize_attention

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod10/square_gpt2_mod10_digits=50_bs=128_inverse \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/square_mod10/n=50/data-inv.test \
#     --visualize_attention

# ## Square mod 19
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=20_bs=128 \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=20/data.test \
#     --visualize_attention \
#     --target_input_text "3 6 -9 1 7 0 -7 7 -5 0 -2 6 -1 -9 -6 -7 0 2 7 -1"

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=20_bs=128_inverse \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=20/data-inv.test \
#     --visualize_attention \
#     --target_input_text "3 6 -9 1 7 0 -7 7 -5 0 -2 6 -1 -9 -6 -7 0 2 7 -1"

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=50_bs=128 \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=50/data.test \
#     --visualize_attention \
#     --target_input_text "1 9 8 3 -1 -6 3 5 9 -1 -6 -4 -1 -6 -2 -8 3 1 6 5 4 -4 -7 -1 4 8 -8 -9 0 3 -9 -6 -5 1 2 -6 9 3 7 -8 1 5 1 4 -6 -4 -6 6 -7 6"

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=50_bs=128_inverse \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=50/data-inv.test \
#     --visualize_attention \
#     --target_input_text "1 9 8 3 -1 -6 3 5 9 -1 -6 -4 -1 -6 -2 -8 3 1 6 5 4 -4 -7 -1 4 8 -8 -9 0 3 -9 -6 -5 1 2 -6 9 3 7 -8 1 5 1 4 -6 -4 -6 6 -7 6"

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_L=6_digits=50_bs=128 \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=50/data.test \
#     --visualize_attention 
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_L=6_digits=50_bs=128_inverse \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=50/data-inv.test \
#     --visualize_attention

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=200_bs=128 \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=200/data.test \
#     --visualize_attention 
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/square_mod19/square_gpt2_mod19_digits=200_bs=128_inverse \
#     --checkpoint_id 1564 \
#     --dataset_path /mnt/nfs/data/small/square_mod19/n=200/data-inv.test \
#     --visualize_attention

# ## max-min
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/max_min/max_min_gpt2_digits=20_V=100_bs=128 \
#     --checkpoint_id 31280 \
#     --dataset_path /mnt/nfs/data/small/max_min/n=20_V=100/data.test \
#     --visualize_attention 
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/max_min/max_min_gpt2_digits=20_V=100_bs=128_inverse \
#     --checkpoint_id 31280 \
#     --dataset_path /mnt/nfs/data/small/max_min/n=20_V=100/data-inv.test \
#     --visualize_attention

## index
# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/index/index_gpt2_longlearning_L=6_digits=13_m=8_bs=128 \
#     --checkpoint_id 31280 \
#     --dataset_path /mnt/nfs/data/small/index/n=13_m=8/data.test \
#     --visualize_attention 

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/index/index_gpt2_longlearning_L=6_digits=13_m=8_bs=128_inverse \
#     --checkpoint_id 31280 \
#     --dataset_path /mnt/nfs/data/small/index/n=13_m=8/data-inv.test \
#     --visualize_attention

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/index/index_gpt2_longlearning_L=6_digits=13_m=8_bs=128 \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/index/n=13_m=8/data.test \
#     --visualize_attention 

# python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/index/index_gpt2_longlearning_L=6_digits=13_m=8_bs=128_inverse \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/index/n=13_m=8/data-inv.test \
#     --visualize_attention

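# ## ReLU oneperm randperm
# NOTE(review): the two disabled commands below point at the plain and
# "_inverse" n=20 models, not the oneperm/randperm ones -- confirm the heading.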
# CUDA_VISIBLE_DEVICES=6 python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128 \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/relu/n=20/data.test \
#     --visualize_attention 

# CUDA_VISIBLE_DEVICES=7 python3 src/evaluation_gpt.py \
#     --model_path /mnt/nfs/results/small/relu/relu_gpt2_digits=20_bs=128_inverse \
#     --checkpoint_id 15640 \
#     --dataset_path /mnt/nfs/data/small/relu/n=20/data-inv.test \
#     --visualize_attention