## FV linear superposition
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "clean_Ex1"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "clean_Ex2"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "clean_Ex3"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "clean_Ex4"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "clean_Ex5"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "context_Ex1"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "context_Ex2"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "context_Ex3"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "context_Ex4"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "context_Ex5"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# Q patching
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_only_context_examples"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --corruption_with_ablation\
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_only_context_xn"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --corruption_with_ablation\
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "country-capital.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# Full Model
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

#all-unambiguous
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-all-unambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# other task x4
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-all-unambiguous-x.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# other task examples
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-other-task-x.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# x -> x
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-xx.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# y -> y
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-yy.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# y -> x
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-yx.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# other x -> y
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-other-x.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# x -> other y
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-other-y.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# x -> y shuffled
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_all"\
   --token_types 8\
   --corrupted_dataset_name "chinese-shuffled.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# fully-clean
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# fully-clean change ambig K to unambig K
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean_k_all_clean_Ex135"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous-k-un.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --corruption_with_ablation\
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# fully-clean change unambig K to ambig K
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean_k_all_clean_Ex24"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous-k-am.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --corruption_with_ablation\
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --device "cuda" \
   --seed 42

# Full Model Q + Fully Clean K/V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean_q_full_model"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

# Fully Clean Q + Full Model K/V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_q_fully_clean"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

## Fully Clean Q/K + change Fully Clean unambiguous Examples’ V to Contextualized V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean_v_all_full_model_Ex24"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

# Fully Model Q/K + change Fully Model unambiguous Examples’ V to Uncontextualized V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_v_all_clean_Ex24"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

## Fully Clean Q/K + change all Fully Clean V to Contextualized V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "fully_clean_v_all_full_model"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

# Fully Model Q/K + change all Fully Model V to Uncontextualized V
python3 extract_sub_function_vector_per_prompt_5_shot.py \
   --model_name "google/gemma-2-2b" \
   --task_name "chinese-ambiguous" \
   --sub_FV_name "full_model_v_all_clean"\
   --token_types 8\
   --corrupted_dataset_name "chinese-ambiguous.json_5_100" \
   --train_dataset_name "chinese-ambiguous.json_5_100" \
   --inject_dataset_name "chinese-ambiguous.json_0_100" \
   --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
   --corruption_with_ablation\
   --device "cuda" \
   --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
    --model_name "google/gemma-2-2b" \
    --task_name "chinese-ambiguous" \
    --sub_FV_name "full_model"\
    --token_types 8\
    --corrupted_dataset_name "chinese-all-ambiguous.json_5_100" \
    --train_dataset_name "chinese-all-ambiguous.json_5_100" \
    --inject_dataset_name "chinese-ambiguous.json_0_100" \
    --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
    --device "cuda" \
    --seed 42

python3 extract_sub_function_vector_per_prompt_5_shot.py \
    --model_name "google/gemma-2-2b" \
    --task_name "chinese-ambiguous" \
    --sub_FV_name "full_model"\
    --token_types 8\
    --corrupted_dataset_name "chinese-all-unambiguous.json_5_100" \
    --train_dataset_name "chinese-all-unambiguous.json_5_100" \
    --inject_dataset_name "chinese-ambiguous.json_0_100" \
    --CIE_path "mean_causal_indirect_effects_chinese-ambiguous.json_5_100_chinese-ambiguous.json_5_25_corrupted.pt"\
    --device "cuda" \
    --seed 42