import torch
import numpy as np
import matplotlib.pyplot as plt
from sklearn.manifold import TSNE

# Load files
clean = torch.load("test_flowers.pt", map_location='cpu')
backdoored = torch.load("test_backdoored_flowers.pt", map_location='cpu')

# Extract embeddings
clean_emb = clean['image_features']
backdoor_emb = backdoored['image_features']

# Convert to numpy
clean_np = clean_emb.numpy()
backdoor_np = backdoor_emb.numpy()

# Combine for t-SNE
X = np.vstack([clean_np, backdoor_np])
y = np.array([0] * len(clean_np) + [1] * len(backdoor_np))  # 0 = clean, 1 = backdoored

# Run t-SNE
tsne = TSNE(n_components=2, perplexity=30, random_state=42)
X_2d = tsne.fit_transform(X)

# Plot
plt.figure(figsize=(8, 6))
plt.scatter(X_2d[y == 0, 0], X_2d[y == 0, 1], c='blue', label='Clean', alpha=0.6)
plt.scatter(X_2d[y == 1, 0], X_2d[y == 1, 1], c='red', label='Backdoored', alpha=0.6)
plt.legend()
plt.title('t-SNE of Text Embeddings (Clean vs Backdoored)')
plt.tight_layout()
plt.savefig("tsne_clean_vs_backdoor_image_flowers.png", dpi=300)
plt.show()
