"""
Research Framework for Multi-Scale Attention Networks for Medical Image Segmentation
Generated as part of AGI Assignment 1 - Agents4Science 2025
"""

# TASK: Multi-Scale Attention Networks for Medical Image Segmentation
TASK = """
Develop and evaluate a novel Multi-Scale Attention U-Net (MSA-UNet) architecture for medical image segmentation.
The system should address scale variation challenges in medical images through cross-scale attention mechanisms
and boundary-aware loss functions, achieving superior performance while maintaining real-time inference capabilities.
"""

# DATASETS: Specific dataset specifications or generation parameters
DATASETS = {
    "synthetic_medical": {
        "description": "Synthetic medical images with ground truth segmentation masks",
        "image_size": (512, 512),
        "num_classes": 5,  # heart, liver, kidney, lung, brain
        "train_size": 10000,
        "val_size": 2000,
        "test_size": 1000,
        "structures_per_image": (1, 3),  # random number of structures per image
        "scale_range": (32, 256),  # pixel size range for structures
        "noise_level": 0.01,  # Gaussian noise standard deviation
        "augmentation": {
            "flip_prob": 0.5,
            "rotation_range": 15,  # degrees
            "scale_range": (0.9, 1.1),
            "brightness_range": (0.8, 1.2)
        }
    }
}

# BASELINES: Relevant comparison methods (both traditional and modern)
BASELINES = {
    "U-Net": {
        "description": "Original U-Net architecture for medical image segmentation",
        "reference": "Ronneberger et al., 2015",
        "implementation": "Standard encoder-decoder with skip connections"
    },
    "Attention U-Net": {
        "description": "U-Net with attention gates for feature refinement",
        "reference": "Oktay et al., 2018",
        "implementation": "U-Net with attention gates in skip connections"
    },
    "ResNet-50": {
        "description": "ResNet-50 backbone with segmentation head",
        "reference": "He et al., 2016",
        "implementation": "ResNet-50 encoder with upsampling decoder"
    },
    "DeepLabV3+": {
        "description": "DeepLabV3+ with atrous convolutions for multi-scale processing",
        "reference": "Chen et al., 2018",
        "implementation": "Xception backbone with ASPP and decoder"
    }
}

# EVALUATION: Comprehensive metrics including domain-specific ones
EVALUATION = {
    "primary_metrics": {
        "Dice_Score": {
            "description": "Overlap coefficient between predicted and ground truth masks",
            "range": [0, 1],
            "higher_is_better": True,
            "target": 0.85
        },
        "Hausdorff_Distance": {
            "description": "Maximum distance between boundary points",
            "range": [0, inf],
            "higher_is_better": False,
            "target": 5.0
        }
    },
    "secondary_metrics": {
        "Boundary_F1_Score": {
            "description": "F1-score computed on boundary pixels only",
            "range": [0, 1],
            "higher_is_better": True,
            "target": 0.80
        },
        "Inference_Time": {
            "description": "Time to process single image (ms)",
            "range": [0, inf],
            "higher_is_better": False,
            "target": 50.0
        },
        "Memory_Usage": {
            "description": "Peak memory usage during inference (MB)",
            "range": [0, inf],
            "higher_is_better": False,
            "target": 2000.0
        }
    },
    "efficiency_metrics": {
        "Parameter_Count": {
            "description": "Total number of trainable parameters",
            "range": [0, inf],
            "higher_is_better": False,
            "target": 5000000
        },
        "FLOPs": {
            "description": "Floating point operations per inference",
            "range": [0, inf],
            "higher_is_better": False,
            "target": 1000000000
        }
    }
}

# COMPARISON_TEMPLATE: Table format for results presentation
COMPARISON_TEMPLATE = """
| Method | Dice Score | Hausdorff Distance | Boundary F1 | Inference Time (ms) | Parameters | Memory (MB) |
|--------|------------|-------------------|-------------|-------------------|------------|-------------|
| U-Net | {unet_dice:.3f} | {unet_hd:.2f} | {unet_bf1:.3f} | {unet_time:.1f} | {unet_params:,} | {unet_mem:.0f} |
| Attention U-Net | {att_unet_dice:.3f} | {att_unet_hd:.2f} | {att_unet_bf1:.3f} | {att_unet_time:.1f} | {att_unet_params:,} | {att_unet_mem:.0f} |
| ResNet-50 | {resnet_dice:.3f} | {resnet_hd:.2f} | {resnet_bf1:.3f} | {resnet_time:.1f} | {resnet_params:,} | {resnet_mem:.0f} |
| DeepLabV3+ | {deeplab_dice:.3f} | {deeplab_hd:.2f} | {deeplab_bf1:.3f} | {deeplab_time:.1f} | {deeplab_params:,} | {deeplab_mem:.0f} |
| MSA-UNet (Ours) | {msa_dice:.3f} | {msa_hd:.2f} | {msa_bf1:.3f} | {msa_time:.1f} | {msa_params:,} | {msa_mem:.0f} |
"""

# ABLATIONS: List of components to analyze
ABLATIONS = {
    "attention_heads": {
        "description": "Number of attention heads in cross-scale attention",
        "values": [1, 2, 4, 8],
        "default": 4
    },
    "attention_scales": {
        "description": "Number of scales for multi-scale processing",
        "values": [2, 3, 4, 5],
        "default": 4
    },
    "loss_weights": {
        "description": "Weighting between Dice loss and boundary loss",
        "values": [(0.5, 0.5), (0.7, 0.3), (0.8, 0.2), (0.9, 0.1)],
        "default": (0.7, 0.3)
    },
    "skip_connections": {
        "description": "Presence of skip connections in decoder",
        "values": [True, False],
        "default": True
    },
    "attention_position": {
        "description": "Position of attention modules in architecture",
        "values": ["encoder", "decoder", "both", "skip_connections"],
        "default": "both"
    }
}

# IMPLEMENTATION: Detailed specifications for reproducibility
IMPLEMENTATION = {
    "framework": "PyTorch 1.12+",
    "python_version": "3.8+",
    "cuda_version": "11.6+",
    "dependencies": [
        "torch>=1.12.0",
        "torchvision>=0.13.0",
        "numpy>=1.21.0",
        "matplotlib>=3.5.0",
        "seaborn>=0.11.0",
        "scikit-learn>=1.1.0",
        "opencv-python>=4.6.0",
        "tqdm>=4.64.0"
    ],
    "hardware_requirements": {
        "gpu": "NVIDIA GPU with 8GB+ VRAM",
        "ram": "16GB+ system RAM",
        "storage": "10GB+ free space"
    },
    "reproducibility": {
        "random_seed": 42,
        "deterministic": True,
        "cudnn_benchmark": False
    },
    "file_structure": {
        "code/": "Python implementation files",
        "data/": "Dataset and metadata files",
        "results/": "Experimental results and figures",
        "paper/": "LaTeX paper and figures",
        "prompts/": "AI contribution logs and prompts"
    }
}

# EXPERIMENTAL_PROTOCOL: Detailed experimental setup
EXPERIMENTAL_PROTOCOL = {
    "training": {
        "epochs": 200,
        "batch_size": 16,
        "optimizer": "Adam",
        "learning_rate": 0.001,
        "weight_decay": 1e-4,
        "scheduler": "StepLR",
        "scheduler_params": {"step_size": 50, "gamma": 0.1},
        "early_stopping": {"patience": 20, "min_delta": 0.001}
    },
    "validation": {
        "frequency": "every epoch",
        "metrics": ["Dice_Score", "Hausdorff_Distance", "Boundary_F1_Score"],
        "save_best": True,
        "save_last": True
    },
    "testing": {
        "metrics": "all_metrics",
        "statistical_tests": ["paired_t_test", "wilcoxon_signed_rank"],
        "confidence_interval": 0.95,
        "multiple_comparison": "bonferroni"
    }
}

