#!/bin/bash

# model="./outputs/qwen3-8b/wiki_structural_sparsity_16_0.5"
# mmlu truthfulqa-multi commonsense_qa openbookqa medmcqa mathqa inverse_scaling_mc
# baseline=${1:-False}
# for model in llama-7b; do # mistral-7b llama-8b mistralv3-7b 
#     model_name="./outputs/${model}/wiki_structural_sparsity_1_0.5"
#     for task in openbookqa piqa winogrande boolq sciq hellaswag arc_easy arc_challenge; do # sciq hellaswag arc_easy arc_challenge
#         for num_extra_neurons in 1; do
#             python -m eval.eval \
#                 --model_name "${model_name}" \
#                 --task_name ${task} \
#                 --num_extra_neurons ${num_extra_neurons} \
#                 --baseline ${baseline} 
#         done
#     done
# done
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name "./outputs/llama-7b/wiki_structural_sparsity_1_0.5" \
#     --task_name openbookqa \
#     --num_extra_neurons 1 \
#     --baseline False

# model_name="./outputs/llama-8b/wiki_structural_sparsity_1_0.6"
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name "${model_name}" \
#     --task_name openbookqa \
#     --num_extra_neurons 1 \
#     --baseline False &
# for rank in 1 2 32; do #llama-8b 
#     model_name="./outputs/lora-llama-8b/wiki_rank_${rank}"
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name "${model_name}" \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons $rank \
#         --pruning_ratio 0.5 \
#         --lora True \ &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name "${model_name}" \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons $rank \
#         --pruning_ratio 0.5 \
#         --lora True \ &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name "${model_name}" \
#         --performance_dir ./performance/ \
#         --task_name boolq \
#         --num_extra_neurons $rank \
#         --pruning_ratio 0.5 \
#         --lora True \ &
#     # CUDA_VISIBLE_DEVICES=5 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name hellaswag \
#     #     --num_extra_neurons 1 \
#     #     --pruning_ratio 0.6 \
#     #     --baseline False &
#     CUDA_VISIBLE_DEVICES=6 python -m eval.eval \
#         --model_name "${model_name}" \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons $rank \
#         --pruning_ratio 0.5 \
#         --lora True \ &
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name "${model_name}" \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons $rank \
#         --pruning_ratio 0.5 \
#         --lora True \ &
#     wait
        
# done

# model_name="./outputs/lora-llama-8b/wiki_rank_${rank}"
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_1" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_2" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 2 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_4" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 4 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# CUDA_VISIBLE_DEVICES=5 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_8" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 8 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# CUDA_VISIBLE_DEVICES=6 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_16" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 16 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name "./outputs/lora-llama-8b/wiki_rank_32" \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 32 \
#     --pruning_ratio 0.5 \
#     --lora True \ &
# wait

# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/deepseek-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name winogrande \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True 

# model_name="./outputs/mistralv3-7b/wiki_structural_sparsity_1_0.0"
# for baseline in False True
# do
#     for pruning_ratio in 0.0 0.1 0.2 0.3 0.4 0.5 0.6
#     do
#         CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name winogrande \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio $pruning_ratio &
#         CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name piqa \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio $pruning_ratio &
#         CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name boolq \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio $pruning_ratio &
#         CUDA_VISIBLE_DEVICES=5 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name arc_challenge \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio $pruning_ratio &
#         CUDA_VISIBLE_DEVICES=6 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name arc_easy \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio $pruning_ratio &
#         wait
#     done
# done

# model_name="./outputs/mistralv3-7b/wiki_structural_sparsity_1_0.0"
# for baseline in False
# do
#     for task in arc_easy arc_challenge boolq piqa winogrande mmlu
#     do
#         CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.0 &
#         CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.1 &
#         CUDA_VISIBLE_DEVICES=5 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.2 &
#         CUDA_VISIBLE_DEVICES=6 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.3 &
#         CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.4 &
#         CUDA_VISIBLE_DEVICES=7 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.5 &
#         CUDA_VISIBLE_DEVICES=4 python -m eval.eval \
#             --model_name $model_name \
#             --performance_dir ./performance/pretrained \
#             --task_name $task \
#             --num_extra_neurons 1 \
#             --baseline $baseline \
#             --pruning_ratio 0.6 &
#         wait
#     done
# done
# arc_easy arc_challenge boolq piqa winogrande mmlu


# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name arc_easy \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name arc_challenge \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name winogrande \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name piqa \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# wait

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name arc_easy \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name arc_challenge \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name winogrande \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 512 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name piqa \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --lora True & 
# # CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
# #     --model_name deepseekv2 \
# #     --performance_dir ./performance/ \
# #     --task_name boolq \
# #     --num_extra_neurons 1 \
# #     --quantization 8bit \
# #     --pruning_ratio 0.5 \
# #     --batch_size 32 \
# #     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --lora True & 
# # CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
# #     --model_name deepseekv2 \
# #     --performance_dir ./performance/ \
# #     --task_name mmlu \
# #     --num_extra_neurons 1 \
# #     --quantization 8bit \
# #     --pruning_ratio 0.5 \
# #     --batch_size 128 \
# #     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-c4 \
#     --performance_dir ./performance/ \
#     --task_name wikitext \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --lora True & 
# wait

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name arc_easy \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name arc_challenge \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name winogrande \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 512 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name piqa \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 3 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name wikitext \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True & 
# wait
# for num_experts_per_tok in 2 4 3 5 6
# do
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 512 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     wait
# done

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 5 \
#     --lora True & 
# wait

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 5 \
#     --lora True & 
# wait

# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 6 \
#     --lora True & 
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 6 \
#     --lora True & 
# wait

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 5 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 6
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 5 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 6 \
#     --lora True &
# wait

# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name deepseekv2 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 3 \
#     --lora True &
# wait

# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 4 &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 5 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/deepseekv2-spon-wiki \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 32 \
#     --num_experts_per_tok 6 \
#     --lora True &
# wait



# for num_experts_per_tok in 2 4 5 6
# do
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name deepseekv2 \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name deepseekv2 \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name deepseekv2 \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 512 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name deepseekv2 \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 128 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     wait
# done

# for num_experts_per_tok in 3
# do
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 256 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 512 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name ./outputs/deepseekv2-spon-wiki \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 128 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     wait
# done

# for num_experts_per_tok in 2 3 4 5 6 7 8
# do
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name olmoe \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 1024 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name olmoe \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 1024 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name olmoe \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 2048 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name olmoe \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 512 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     wait
# done
# boolq 128 
# for num_experts_per_tok in 2 3 4 5 6 7 8
# do
#     CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#         --performance_dir ./performance/ \
#         --task_name arc_easy \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 1024 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#         --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#         --performance_dir ./performance/ \
#         --task_name arc_challenge \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 1024 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#         --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#         --performance_dir ./performance/ \
#         --task_name winogrande \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 2048 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#         --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#         --performance_dir ./performance/ \
#         --task_name piqa \
#         --num_extra_neurons 1 \
#         --quantization 8bit \
#         --pruning_ratio 0.5 \
#         --batch_size 512 \
#         --num_experts_per_tok $num_experts_per_tok \
#         --lora True &
#     wait
# done
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 4 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 5 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 6 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6/ \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 7 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name boolq \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 8 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 4 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 5 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 6 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 7 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name olmoe \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 128 \
#     --num_experts_per_tok 8 \
#     --lora True &
# wait


# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 2 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 3 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 4 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 5 \
#     --lora True &
# wait
# CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 6 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 7 \
#     --lora True &
# CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     --model_name ./outputs/olmoe-spon-wiki-1e-6 \
#     --performance_dir ./performance/ \
#     --task_name mmlu \
#     --num_extra_neurons 1 \
#     --quantization 8bit \
#     --pruning_ratio 0.5 \
#     --batch_size 256 \
#     --num_experts_per_tok 8 \
#     --lora True &
# wait

# for model in llama-70b; do # mistral-7b llama-8b mistralv3-7b 
#     model_name="./outputs/${model}-spon-wiki/"
#     # for task in wikitext; do # sciq hellaswag arc_easy arc_challenge
#     # CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "wikitext" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 4 \
#     #     --baseline True
#     # wait
#     # CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "mmlu" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 32 \
#     #     --baseline True
#     # wait
#     # CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "arc_challenge" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 128 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "arc_easy" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 128 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "boolq" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 16 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "piqa" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 128 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "winogrande" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 512 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "truthfulqa_gen" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 128 \
#     #     --baseline True 
    
#     # CUDA_VISIBLE_DEVICES=2 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "commonsense_qa" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 256 \
#     #     --baseline True &
#     # CUDA_VISIBLE_DEVICES=3 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "medmcqa" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 128 \
#     #     --baseline True &
#     yes | CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#         --model_name "${model_name}" \
#         --task_name "mathqa" \
#         --num_extra_neurons 1 \
#         --quantization 4bit \
#         --pruning_ratio 0.5 \
#         --batch_size 128 \
#         --baseline True 
#     # CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
#     #     --model_name "${model_name}" \
#     #     --task_name "openbookqa" \
#     #     --num_extra_neurons 1 \
#     #     --quantization 4bit \
#     #     --pruning_ratio 0.5 \
#     #     --batch_size 256 \
#     #     --baseline True 
#     done
# done

for baseline in True False
do
    for model in qwen3-32b; do #llama-70b qwen3-32b 
        model_name="./outputs/${model}-spon-wiki/"
        # for task in wikitext; do # sciq hellaswag arc_easy arc_challenge
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "mmlu" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 16 \
            --baseline $baseline &
        CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "arc_challenge" \
            --num_extra_neurons 1 \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        wait
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "arc_easy" \
            --num_extra_neurons 1 \
            --quantization 8bit \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "boolq" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 8 \
            --baseline $baseline &
        wait
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "piqa" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "winogrande" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 256 \
            --baseline $baseline &
        wait
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "truthfulqa_mc1" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "commonsense_qa" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 128 \
            --baseline $baseline &
        wait
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "medmcqa" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        yes | CUDA_VISIBLE_DEVICES=1 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "mathqa" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 64 \
            --baseline $baseline &
        wait
        CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
            --model_name "${model_name}" \
            --task_name "openbookqa" \
            --num_extra_neurons 1 \
            --quantization 4bit \
            --pruning_ratio 0.5 \
            --batch_size 128 \
            --baseline $baseline &
        wait
    done
done


# mmlu truthfulqa-multi commonsense_qa openbookqa medmcqa mathqa inverse_scaling_mc

# for model in qwen3-32b; do # mistral-7b llama-8b mistralv3-7b 
#     model_name="./outputs/${model}-spon-wiki/"
#     for task in wikitext; do # sciq hellaswag arc_easy arc_challenge
#         for num_extra_neurons in 1; do
#             CUDA_VISIBLE_DEVICES=0 python -m eval.eval \
#                 --model_name "${model_name}" \
#                 --task_name ${task} \
#                 --num_extra_neurons 1 \
#                 --quantization 4bit \
#                 --pruning_ratio 0.5 \
#                 --batch_size 4 \
#                 --baseline True
#         done
#     done
# done
