import os
import sys

MODEL_PATHs = {
    # LM
    "MiniLM": "/path/to/models/sentence-transformers--all-MiniLM-L6-v2/",
    "SentenceBert": "/path/to/models/sentence-transformers--multi-qa-distilbert-cos-v1/",
    "e5-large": "/path/to/models/intfloat--e5-large-v2/",
    "roberta": "/path/to/models/sentence-transformers--all-roberta-large-v1/",

    # LLM
    "Qwen-3B": "/path/to/models/Qwen--Qwen2.5-3B-Instruct", 
    "Qwen-7B": "/path/to/models/Qwen--Qwen2.5-7B-Instruct",
    "Qwen-14B": "/path/to/models/Qwen--Qwen2.5-14B-Instruct",
    "Qwen-32B": "/path/to/models/Qwen--Qwen2.5-32B-Instruct",
    "Mistral-7B": "/path/to/models/mistral-7B-Instruct",  
    "Ministral-8B": "/path/to/models/ministral-8b-Instruct",
    "Llama3-8B": "/path/to/models/llama-3.1-8B-Instruct/",  
    "Qwen3-8B": "/path/to/models/qwen3-8b"
}
# Base path for saving models
SAVED_MODELS_BASE_PATH = "/path/to/GraphAD_data/saved_models"

def get_model_save_path(model_name, dataset, re_split, llm, seed, atk_name=None, **kwargs):
    """
    Generate unified model save path for different models using underscore separation
    
    Args:
        model_name: "GraphGPT", "LLaGA", "InstructionTuning"
        dataset: dataset name like "cora", "citeseer"
        re_split: 0 (semi-supervised), 1 (supervised), 2 (inductive)
        llm: llm name like "Mistral-7B", "Qwen-7B"
        seed: random seed
        atk_name: attack name, default None
        **kwargs: additional model-specific parameters
            - neighbor_template: for LLaGA (ND/HO)
            - num_epochs/num_epoch: training epochs
            - lm_encoder: for LLaGA encoder type
            - stage_info: for GraphGPT (e.g., "s1_2_s2_10" for s1_epoch=2, s2_epoch=10)
            - prompt: for noise experiments ("noise", "noisetxt", None)
    
    Returns:
        save_path: full path for model saving
    """
    # Determine setting name
    setting_map = {0: "semi", 1: "sup", 2: "ind"}
    setting = setting_map.get(re_split, "unk")
    
    # Build path components with underscore separation
    path_components = [model_name, dataset, setting, llm]
    
    # Add attack name if provided for transductive settings (re_split = 0 or 1)
    if atk_name is not None and re_split != 2:
        # For transductive settings, add attack info to model path
        if isinstance(atk_name, dict):
            # Format: attack_ptbXX for dict-style attack info
            attack_str = f"{atk_name['attack']}_ptb{int(atk_name['ptb_rate']*100)}"
            path_components.append(f"atk_{attack_str}")
        else:
            # Format: attack name string
            path_components.append(f"atk_{atk_name}")

    # Add model-specific info
    extra_info_parts = []
    
    # For LLaGA: neighbor template and encoder
    if model_name == "LLaGA":
        if "neighbor_template" in kwargs:
            extra_info_parts.append(kwargs["neighbor_template"])
        if "lm_encoder" in kwargs and kwargs["lm_encoder"] != "roberta":
            extra_info_parts.append(kwargs["lm_encoder"])
        # Add prompt suffix for LLaGA noise experiments
        if "prompt" in kwargs and kwargs["prompt"] is not None:
            extra_info_parts.append(kwargs["prompt"])
    
    # For GraphGPT: stage information
    elif model_name == "GraphGPT":
        if "stage_info" in kwargs:
            extra_info_parts.append(kwargs["stage_info"])
        elif "s1_epoch" in kwargs and "s2_epoch" in kwargs:
            extra_info_parts.append(f"s1_{kwargs['s1_epoch']}_s2_{kwargs['s2_epoch']}")
        # Add prompt suffix for GraphGPT noise experiments
        if "prompt" in kwargs and kwargs["prompt"] is not None:
            extra_info_parts.append(kwargs["prompt"])
    
    # For InstructionTuning: epoch info
    elif model_name == "InstructionTuning":
        if "num_epoch" in kwargs:
            extra_info_parts.append(f"ep_{kwargs['num_epoch']}")
        if "prompt_type" in kwargs:
            extra_info_parts.append(f"prompt_{kwargs['prompt_type']}")
    
    # General epoch info for LLaGA
    if model_name == "LLaGA" and "num_epochs" in kwargs:
        extra_info_parts.append(f"ep_{kwargs['num_epochs']}")
    
    # Add extra info if any
    if extra_info_parts:
        path_components.append("_".join(extra_info_parts))
    
    # Add seed
    path_components.append(f"seed_{seed}")
    
    # Create final path
    model_dir_name = "_".join(path_components)
    save_path = os.path.join(SAVED_MODELS_BASE_PATH, model_dir_name)
    
    # Create directory if not exists
    os.makedirs(save_path, exist_ok=True)
    
    return save_path


def check_model_exists(save_path, model_files):
    """
    Check if all required model files exist in the save path
    
    Args:
        save_path: path to model directory
        model_files: list of required model files
    
    Returns:
        bool: True if all files exist, False otherwise
    """
    if not os.path.exists(save_path):
        return False
    
    for file_name in model_files:
        file_path = os.path.join(save_path, file_name)
        if not os.path.exists(file_path):
            return False
    
    return True


def get_setting_info(re_split):
    """
    Get setting suffix and setting name based on re_split value
    
    Args:
        re_split: 0 (semi-supervised), 1 (supervised), 2 (inductive)
    
    Returns:
        tuple: (suffix_str, setting_name)
    """
    setting_map = {
        0: ("", "Semi"),
        1: ("_s", "Supervised"), 
        2: ("_inductive", "Inductive")
    }
    return setting_map.get(re_split, ("", "Unknown"))


# LLM API Configurations - Set your own API keys
LLM_API_CONFIGS = {
    "openai": {
        "base_url": "https://api.openai.com/v1",
        "api_key": "your-openai-api-key-here",
        "models": ["gpt-3.5-turbo", "gpt-4", "gpt-4-turbo", "gpt-4o-mini"]
    },
    "deepseek": {
        "base_url": "https://api.deepseek.com",
        "api_key": "your-deepseek-api-key-here", 
        "models": ["deepseek-chat"]
    }
}
