# relearn_attack.py
import os
import argparse
import random
import torch
from torch.utils.data import DataLoader, Subset, SequentialSampler, DistributedSampler
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel
from torch.nn.utils.rnn import pad_sequence
from utils.data_loader_wmdp import get_train_data_ddp, LanguageModelingDataset
os.environ.setdefault("MASTER_ADDR", "127.0.0.1")
os.environ.setdefault("MASTER_PORT", "29500")
access_token = "your_huggingface_access_token"

def parse_args():
    parser = argparse.ArgumentParser(description="Relearning Attack Script")
    parser.add_argument("--model_name",type=str,required=True,help="基座模型名称（HuggingFace 上的 ID），例如 mistralai/Mistral-7B-v0.1")
    parser.add_argument("--model_path",type=str,required=True,help="已有 LoRA 微调模型所在的目录（即之前训练后保存的 LoRA adapter 目录）")
    parser.add_argument("--save_path",type=str,required=True,help="Relearn Attack 完成后新的 LoRA adapter 保存目录")
    parser.add_argument("--dataset",type=str,required=True,help="数据集名称，默认为 wmdp-bio")
    parser.add_argument("--batch_size",type=int,required=True,help="Relearn 微调时的 batch_size")
    parser.add_argument( "--lr", type=float, required=True, help="Relearn 微调时的学习率")
    parser.add_argument("--num_epochs",type=int,required=True,help="Relearn 微调的 epoch 数")
    parser.add_argument("--seed",type=int,required=True,help="随机种子")
    return parser.parse_args()

def main():
    args = parse_args()
    # 固定随机种子，确保可复现
    torch.manual_seed(args.seed)
    random.seed(args.seed)

    # 1. 设备设置：优先使用 cuda:0
    device = torch.device("cuda:1" if torch.cuda.is_available() else "cpu")
    print(f"Using device: {device}")

    # 2. 加载 tokenizer
    #    注意：LoRA 保存目录里通常也会保存 tokenizer，所以先尝试从 model_path 加载 tokenizer
    try:
        tokenizer = AutoTokenizer.from_pretrained(args.model_path, use_fast=True)
        print(f"Loaded tokenizer from {args.model_path}")
    except Exception as e:
        print(f"无法从 {args.model_path} 加载 tokenizer，将尝试从 {args.model_name} 加载：{e}")
        tokenizer = AutoTokenizer.from_pretrained(args.model_name, use_fast=True)

    def collate_fn(batch):
        """
        batch 是一个 list，每个元素是来自 LanguageModelingDataset 的 dict，包含键 'input_ids'、'attention_mask'。
        我们对它们进行 pad_sequence，使同一 batch 内长度一致。
        """
        input_ids_list = [torch.tensor(item["input_ids"], dtype=torch.long) for item in batch]
        attention_mask_list = [torch.tensor(item["attention_mask"], dtype=torch.long) for item in batch]
        # pad 到当前 batch 内的最大长度
        input_ids_padded = pad_sequence(input_ids_list, batch_first=True, padding_value=tokenizer.pad_token_id)
        attention_mask_padded = pad_sequence(attention_mask_list, batch_first=True, padding_value=0)
        return {
            "input_ids": input_ids_padded,
            "attention_mask": attention_mask_padded
        }

    # 3. 加载基座模型 + LoRA adapter
    print("Loading base model and LoRA adapter...")
    base_model = AutoModelForCausalLM.from_pretrained(
        args.model_name,
        torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
        use_cache=False
    )
    model = PeftModel.from_pretrained(base_model, args.model_path, torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32)
    model = model.to(device)
    model.train()

    for name, param in model.named_parameters():
        if "lora" in name.lower():
            param.requires_grad = True
        else:
            param.requires_grad = False
    # 4. 构造“从 forget 集合中随机抽取 600 条样本”的 DataLoader
    #    我们调用 get_train_data_ddp，但由于只用单卡，所以 world_size=1, rank=0，sampler_cls=SequentialSampler
    print("Building forget DataLoader for sampling 600 examples...")
    if args.dataset == "wmdp-cyber":
        forget_corpora, retain_corpora = ["cyber-forget-corpus"], ["cyber-retain-corpus"]
        all_forget_loaders, _ = get_train_data_ddp(
            forget_corpora, retain_corpora, tokenizer,
            batch_size=args.batch_size,
            sampler_cls=DistributedSampler,  # 让每个进程切片
            world_size=1, rank=0
        )
    elif args.dataset == "wmdp-bio":
        forget_corpora, retain_corpora = ["bio_forget"], ["bio-retain-corpus"]
        all_forget_loaders, _ = get_train_data_ddp(
            forget_corpora, retain_corpora, tokenizer,
            batch_size=args.batch_size,
            sampler_cls=DistributedSampler,  # 让每个进程切片
            world_size=1, rank=0
        )
    else:
        raise ValueError(f"Unsupported dataset: {args.dataset}")
    # get_train_data_ddp 返回的 forget_loaders 通常是一个长度与 forget_corpora 等长的列表
    forget_loader_full = all_forget_loaders[0]  # 假设只有一个 forget corpora
    full_dataset = forget_loader_full.dataset  # 应该是 LanguageModelingDataset

    total_num = len(full_dataset)
    print(f"Total forget samples in dataset: {total_num}")
    if total_num < 60:
        raise ValueError(f"忘却集合样本数量仅有 {total_num}，不足 60 条。")

    # 随机抽 60 个索引
    selected_indices = random.sample(range(total_num), 60)
    # 用 Subset 构造只保留这 60 条样本的子数据集
    subset_dataset = Subset(full_dataset, selected_indices)

    # 用常规 DataLoader 将 60 条样本打包，shuffle=True
    relearn_loader = DataLoader(
        subset_dataset,
        batch_size=args.batch_size,
        collate_fn=collate_fn,
        shuffle=True,
        drop_last=False
    )
    print(f"抽取了 60 条 forget 样本，总 dataset 长度 {total_num}，已构造 Relearn DataLoader，batch_size={args.batch_size}")

    # 5. 定义优化器
    optimizer = torch.optim.AdamW(model.parameters(), lr=args.lr)

    # 6. Relearn 微调循环（默认为 1 个 epoch）
    print("Starting Relearn fine-tuning (Relearning Attack)...")
    for epoch in range(args.num_epochs):
        epoch_loss = 0.0
        step = 0
        for batch in relearn_loader:
            step += 1
            input_ids = batch["input_ids"].to(device)         # [batch_size, seq_len]
            attention_mask = batch["attention_mask"].to(device)  # [batch_size, seq_len]

            # LM HEAD 训练：labels = input_ids，模型会自行计算 shift
            outputs = model(
                input_ids=input_ids,
                attention_mask=attention_mask,
                labels=input_ids
            )
            loss = outputs.loss
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

            epoch_loss += loss.item()
            if step % 10 == 0 or step == len(relearn_loader):
                print(f"[Epoch {epoch+1} Step {step}/{len(relearn_loader)}] loss = {loss.item():.4f}")

        avg_loss = epoch_loss / len(relearn_loader)
        print(f"==> Epoch {epoch+1} done, average loss = {avg_loss:.4f}")

    # 7. 保存微调后的 LoRA adapter
    print(f"Saving Relearn 后的 LoRA 模型到 {args.save_path} ...")
    os.makedirs(args.save_path, exist_ok=True)
    model.save_pretrained(args.save_path)
    tokenizer.save_pretrained(args.save_path)
    print("✅ Relearn Attack 完成，模型已保存。")

if __name__ == "__main__":
    main()
