"""
Multi-Modal Biometric Dataset for Adversarial Robustness Research
Generated by AI Research Agent for Agents4Science 2025
"""

import torch
from torch.utils.data import Dataset
import numpy as np
import os
from scipy.signal import butter, lfilter
import librosa
import cv2

class ResearchDataset(Dataset):
    def __init__(self, data_path=None, transform=None, mode='train', num_subjects=10000, samples_per_subject=10):
        self.data_path = data_path
        self.transform = transform
        self.mode = mode
        self.num_subjects = num_subjects
        self.samples_per_subject = samples_per_subject
        self.data = self.generate_synthetic_data()

    def generate_synthetic_data(self):
        # Create data with subject/class-specific patterns
        # Add realistic artifacts and variations
        all_data = []
        for subject_id in range(self.num_subjects):
            for _ in range(self.samples_per_subject):
                # Face data: 224x224 RGB image
                face_pattern = np.random.rand(224, 224, 3) * 0.1 + (subject_id % 255) / 255.0
                face_noise = np.random.normal(0, 0.02, (224, 224, 3))
                face_data = np.clip(face_pattern + face_noise, 0, 1).astype(np.float32)

                # Voice data: 16kHz audio, MFCC-like features
                # Simulate a short audio clip and extract MFCCs
                sr = 16000
                duration = 2 # seconds
                t = np.linspace(0, duration, int(sr * duration), endpoint=False)
                freq_base = 100 + (subject_id % 50) * 5
                voice_pattern = 0.5 * np.sin(2 * np.pi * freq_base * t) + 0.2 * np.sin(2 * np.pi * 2 * freq_base * t)
                voice_noise = np.random.normal(0, 0.01, voice_pattern.shape)
                voice_data_raw = voice_pattern + voice_noise
                # Apply a simple bandpass filter to simulate speech characteristics
                nyq = 0.5 * sr
                low = 300 / nyq
                high = 3400 / nyq
                b, a = butter(5, [low, high], btype='band')
                voice_data_filtered = lfilter(b, a, voice_data_raw)
                # Simulate MFCC extraction (simplified)
                mfccs = librosa.feature.mfcc(y=voice_data_filtered, sr=sr, n_mfcc=13)
                # Pad or truncate to a fixed length for consistency
                fixed_length = 100 # Example fixed length for MFCC frames
                if mfccs.shape[1] < fixed_length:
                    voice_data = np.pad(mfccs, ((0,0),(0, fixed_length - mfccs.shape[1])), 'constant')
                else:
                    voice_data = mfccs[:, :fixed_length]
                voice_data = voice_data.astype(np.float32)

                # Behavioral data: 30-dimensional feature vectors
                behavioral_pattern = np.random.rand(30) * 0.1 + (subject_id % 10) / 10.0
                behavioral_noise = np.random.normal(0, 0.01, 30)
                behavioral_data = np.clip(behavioral_pattern + behavioral_noise, 0, 1).astype(np.float32)

                all_data.append({
                    'face': face_data,
                    'voice': voice_data,
                    'behavioral': behavioral_data,
                    'label': subject_id
                })
        return all_data

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):
        sample = self.data[idx]
        face = sample['face']
        voice = sample['voice']
        behavioral = sample['behavioral']
        label = sample['label']

        if self.transform:
            face = self.transform(face)
            # Voice and behavioral transforms would be applied here if needed
            # For simplicity, assuming they are already in desired format or transformed internally

        return {'face': face, 'voice': voice, 'behavioral': behavioral, 'label': label}

if __name__ == '__main__':
    print("Generating synthetic multi-modal dataset...")
    dataset = ResearchDataset(num_subjects=10, samples_per_subject=5)
    print(f"Dataset size: {len(dataset)}")
    sample = dataset[0]
    print(f"Sample 0 - Face shape: {sample['face'].shape}, Voice shape: {sample['voice'].shape}, Behavioral shape: {sample['behavioral'].shape}, Label: {sample['label']}")
    print("Dataset generation complete.")
