#!/bin/bash

set -e  # Exit on any error
cd ..

# # EXP#1 TUNING Step 1: llama-70b-3.3 - done
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --use-scale true \
# --layer-idx 3 8 13 18 23 28 33 38 43 48 53 58 63 68 73 78 \
# --train-feature-type average \
# --verbose \
# --model-name llama-70b-3.3 \
# --features-file ./results/extracted_feats_all_layers_llama-70b-3.3.h5 \
# --results-csv ./results/results_llama-70b-3.3_all_layers.csv

# # # EXP#2 TUNING Step 2: llama-70b-3.3 
# for FEATURE in last average all; do
#     for USE_SCALE in true false; do
#         for PROBE_TYPE in diffmean lda; do
#             python ./scripts/train_test_probes.py \
#             --probe-type ${PROBE_TYPE} \
#             --regularization 0 \
#             --layer-idx 33 38 68 73 78 \
#             --train-feature-type ${FEATURE} \
#             --use-scale ${USE_SCALE} \
#             --verbose \
#             --model-name llama-70b-3.3 \
#             --features-file ./results/extracted_feats_all_layers_llama-70b-3.3.h5 \
#             --results-csv ./results/results_llama-70b-3.3_all_layers.csv
#         done

#         python ./scripts/train_test_probes.py \
#             --probe-type lr \
#             --regularization 1e-4 \
#             --layer-idx 33 38 68 73 78 \
#             --train-feature-type ${FEATURE} \
#             --use-scale ${USE_SCALE} \
#             --verbose \
#             --model-name llama-70b-3.3 \
#             --features-file ./results/extracted_feats_all_layers_llama-70b-3.3.h5 \
#             --results-csv ./results/results_llama-70b-3.3_all_layers.csv
#     done
# done

# # EXP#3 TUNING Step 3: layer tuning for other models - llama 8b
# for MODEL in llama-8b llama-8b-base; do
#     python ./scripts/train_test_probes.py \
#     --probe-type lr \
#     --regularization 1e-4 \
#     --layer-idx {0..31} \
#     --train-feature-type average \
#     --use-scale false \
#     --verbose \
#     --model-name ${MODEL} \
#     --features-file ./results/extracted_feats_all_layers_${MODEL}.h5 \
#     --results-csv ./results/results_${MODEL}_all_layers.csv
# done

# main - llama-70b-3.3 & llama-8b
MODEL=llama-70b-3.3
for LAYER in 33; do
    python ./scripts/train_test_probes.py \
    --probe-type lr \
    --regularization 1e-4 \
    --use-scale true \
    --layer-idx ${LAYER} \
    --train-feature-type average \
    --verbose \
    --model-name ${MODEL} \
    --features-file ./results/extracted_feats_all_layers_${MODEL}.h5 \
    --results-csv ./results/results_${MODEL}_all_layers.csv
done

# main - llama-8b for all 32 layers
# for LAYER in {0..27}; do
# for LAYER in 15; do
#     python ./scripts/train_test_probes.py \
#     --probe-type lr \
#     --regularization 1 \
#     --layer-idx ${LAYER} \
#     --train-feature-type average \
#     --verbose \
#     --model-name llama-8b \
#     --features-file ./results/extracted_feats_all_layers_llama-8b.h5 \
#     --results-csv ./results/results_llama-8b_all_layers.csv
# done

# # robustness - llama 70b
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 33 \
# --train-feature-type average \
# --verbose \
# --model-name llama-70b-3.3 \
# --features-file ./results/extracted_feats_layer33_llama-70b-3.3.h5 \
# --results-csv ./results/results_llama-70b-3.3_all_layers.csv
# # robustness - llama 70b base
# MODEL_NAME=llama-70b-base
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 33 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_layer33_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv

# # robustness - llama 8b
# MODEL_NAME=llama-8b
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1e-4 \
# --use-scaler false \
# --layer-idx 15 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv
# # robustness - llama 8b base
# MODEL_NAME=llama-8b-base
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1e-4 \
# --use-scaler false \
# --layer-idx 15 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv

# # robustness - qwen 14b
# MODEL_NAME=qwen-14b
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 30 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv
# # robustness - qwen 14b base
# MODEL_NAME=qwen-14b-base
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 30 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv

# # robustness - qwen 7b
# MODEL_NAME=qwen-7b
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 18 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv
# # robustness - qwen 7b base
# MODEL_NAME=qwen-7b-base
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 18 \
# --train-feature-type average \
# --verbose \
# --model-name ${MODEL_NAME} \
# --features-file ./results/extracted_feats_all_layers_${MODEL_NAME}.h5 \
# --results-csv ./results/results_${MODEL_NAME}_all_layers.csv



# # baseline: got
# python ./scripts/train_test_probes.py \
# --probe-type diffmean \
# --regularization 0 \
# --layer-idx 33 \
# --train-feature-type last \
# --train-tasks got__best \
# --verbose

# # baseline: repe
# python ./scripts/train_test_probes.py \
# --probe-type lr \
# --regularization 1 \
# --layer-idx 33 \
# --train-feature-type all \
# --train-tasks repe_honesty__plain \
# --verbose


# for LAYER in 77; do
#     for TRAIN_FEATURE_TYPE in average all last; do
#         python ./scripts/train_test_probes.py \
#         --probe-type lr \
#         --regularization 1 \
#         --layer-idx ${LAYER} \
#         --train-feature-type ${TRAIN_FEATURE_TYPE} \
#         --verbose

#         for PROBE_TYPE in lda pca diffmean; do
#             python ./scripts/train_test_probes.py \
#             --probe-type ${PROBE_TYPE} \
#             --regularization 0 \
#             --layer-idx ${LAYER} \
#             --train-feature-type ${TRAIN_FEATURE_TYPE} \
#             --verbose
#         done
#     done
# done


