#!/bin/bash

# Change to GraphGPT directory
cd ../LLMPredictor/GraphGPT/

# Create logs directory if it doesn't exist
mkdir -p logs_atk

# Check if required parameters are provided
if [ $# -lt 3 ]; then
    echo "Usage: bash run_graphgpt_atk_trans.sh <dataset_name> <attack> <ptb_rate> [seed] [source_prompt] [gpu_id] [atk_emb_type] [atk_seed]"
    echo "Supported datasets: cora, citeseer, instagram, wikics, pubmed, reddit, photo, history, computer, arxiv"
    echo "Supported attacks: pgd, grbcd, prbcd, text_fooler"
    echo "Source prompt options: None, noise, noisetxt"
    echo "Example: bash run_graphgpt_atk_trans.sh cora pgd 0.1 0 noise 0 bow 0"
    exit 1
fi

DATASET=$1
ATTACK=$2
PTB_RATE=$3
SEED=${4:-0}           # Default seed is 0
SOURCE_PROMPT=${5:-None}  # Default source_prompt is None
GPU_ID=${6:-0}         # Default GPU ID is 0
ATK_EMB_TYPE=${7:-bow} # Default attack embedding type is bow
ATK_SEED=${8:-$SEED}   # Default attack seed is same as data seed

# Construct source prompt argument
if [ "$SOURCE_PROMPT" = "None" ] || [ "$SOURCE_PROMPT" = "none" ] || [ -z "$SOURCE_PROMPT" ]; then
    SOURCE_PROMPT_ARG=""
    NOISE_SUFFIX=""
else
    SOURCE_PROMPT_ARG="--source_prompt=$SOURCE_PROMPT"
    NOISE_SUFFIX="_${SOURCE_PROMPT}"
fi

# Determine attack type based on attack name
if [[ "$ATTACK" == "textfooler" || "$ATTACK" == "llm" || "$ATTACK" == "gpt" ]]; then
    ATK_TYPE="text"
else
    ATK_TYPE="structure"
fi

echo "Starting GraphGPT attack evaluation at $(date)..."
echo "Dataset: $DATASET, Attack: $ATTACK, PTB Rate: $PTB_RATE, Seed: $SEED, Source Prompt: $SOURCE_PROMPT, GPU: $GPU_ID"
echo "Attack Embedding Type: $ATK_EMB_TYPE, Attack Seed: $ATK_SEED, Attack Type: $ATK_TYPE"

# Define Python commands based on dataset
if [ "$DATASET" = "cora" ] || [ "$DATASET" = "citeseer" ] || [ "$DATASET" = "instagram" ]; then
    # For cora, citeseer, instagram: transductive setting (re_split=1, s2_epoch=20)
    echo "Running $DATASET with standard configuration..."
    python3 -u main_atk.py --dataset=$DATASET --do_stage1=0 --seed=$SEED --load_ground_embedding=0 --re_split=1 --s2_epoch=20 --gpu_id=$GPU_ID --s2_batch_size=16 --attack=$ATTACK --atk_type=$ATK_TYPE --ptb_rate=$PTB_RATE --atk_emb_type=$ATK_EMB_TYPE --atk_seed=$ATK_SEED $SOURCE_PROMPT_ARG 2>&1 | tee ./logs_atk/attack_transductive_${DATASET}_${ATTACK}_${ATK_TYPE}_ptb${PTB_RATE//.}_${ATK_EMB_TYPE}_atkseed${ATK_SEED}_seed${SEED}${NOISE_SUFFIX}.log

elif [ "$DATASET" = "wikics" ] || [ "$DATASET" = "pubmed" ]; then
    # For wikics, pubmed: s1_epoch=1, s2_epoch=10
    echo "Running $DATASET with wikics/pubmed configuration..."
    python3 -u main_atk.py --dataset=$DATASET --do_stage1=1 --s1_epoch=1 --seed=$SEED --load_ground_embedding=0 --re_split=1 --s2_epoch=10 --gpu_id=$GPU_ID --s2_batch_size=16 --attack=$ATTACK --atk_type=$ATK_TYPE --ptb_rate=$PTB_RATE --atk_emb_type=$ATK_EMB_TYPE --atk_seed=$ATK_SEED $SOURCE_PROMPT_ARG 2>&1 | tee ./logs_atk/attack_transductive_${DATASET}_${ATTACK}_${ATK_TYPE}_ptb${PTB_RATE//.}_${ATK_EMB_TYPE}_atkseed${ATK_SEED}_seed${SEED}${NOISE_SUFFIX}.log

elif [ "$DATASET" = "reddit" ] || [ "$DATASET" = "photo" ] || [ "$DATASET" = "history" ] || [ "$DATASET" = "computer" ]; then
    # For reddit, photo, history, computer: s1_epoch=1, s2_epoch=4
    echo "Running $DATASET with large dataset configuration..."
    python3 -u main_atk.py --dataset=$DATASET --do_stage1=1 --s1_epoch=1 --seed=$SEED --load_ground_embedding=0 --re_split=1 --s2_epoch=4 --s2_batch_size=16 --gpu_id=$GPU_ID --attack=$ATTACK --atk_type=$ATK_TYPE --ptb_rate=$PTB_RATE --atk_emb_type=$ATK_EMB_TYPE --atk_seed=$ATK_SEED $SOURCE_PROMPT_ARG 2>&1 | tee ./logs_atk/attack_transductive_${DATASET}_${ATTACK}_${ATK_TYPE}_ptb${PTB_RATE//.}_${ATK_EMB_TYPE}_atkseed${ATK_SEED}_seed${SEED}${NOISE_SUFFIX}.log
else
    echo "Error: Unsupported dataset '$DATASET'"
    echo "Supported datasets: cora, citeseer, instagram, wikics, pubmed, reddit, photo, history, computer, arxiv"
    exit 1
fi

echo "GraphGPT attack evaluation completed at $(date). Check log files for results." 