"""
REPRODUCIBILITY GUIDE

This document provides the necessary configurations to reproduce the experimental 
results using this script (`diffpc_flip.py`).

===================
Prerequisites
===================

1.  Install Dependencies: Ensure you have PyTorch and Torchvision installed.
    pip install torch torchvision

2.  Hardware: A CUDA-enabled GPU is required, as the configurations 
    specify a CUDA device.

===================
How to Run an Experiment
===================

To run a specific experiment, you need to modify the `if __name__ == "__main__":` 
block at the bottom of this file. Each section below provides the exact 
`DiffPCConfig` instance to use for that experiment.

Procedure:
1.  Navigate to the bottom of this file.
2.  Replace the entire `cfg = DiffPCConfig(...)` block with the configuration 
    provided for the desired experiment.
3.  Run the script from your terminal:
    python diffpc_flip.py

===================
Experiment Configurations
===================

----------------------------------------------------------------------
1. MNIST with a 784-400-10 Network
----------------------------------------------------------------------
This configuration trains a network with one hidden layer of 400 units on 
the standard MNIST dataset.

Expected Test Accuracy: ~98.33%

To run, use this block:
------------------------
if __name__ == "__main__":
    cfg = DiffPCConfig(
        layer_dims=[784, 400, 10],
        lt_m=0,
        lt_n=5,
        lt_a=1.0,
        lt_scheduler_type="cyclic_phase",
        gamma_value=0.05,
        gamma_every_n=None,
        t_init_cycles=15,
        phase2_cycles=15,
        pc_lr=0.0001,
        batch_size=256,
        epochs=200,
        use_adamw=True,
        adamw_weight_decay=0.01,
        adamw_betas=(0.9, 0.999),
        adamw_eps=1e-08,
        clip_grad_norm=1.0,
        seed=2,
        run_name="mnist_400h",
        use_fashion_mnist=False,
        dropout_rate=0.5,
        v1_dropout=False,
        random_crop_padding=2,
        normalize=True,
        fmnist_hflip_p=0.0,
        device="cuda:0" # Adjust device ID if necessary
    )
    main(cfg)

----------------------------------------------------------------------
2. MNIST with a 784-1024-512-10 Network
----------------------------------------------------------------------
This configuration trains a deeper network with two hidden layers on the MNIST dataset.

Expected Test Accuracy: ~99.33%

To run, use this block:
------------------------
if __name__ == "__main__":
    cfg = DiffPCConfig(
        layer_dims=[784, 1024, 512, 10],
        lt_m=0,
        lt_n=8,
        lt_a=1.0,
        lt_scheduler_type="cyclic_phase",
        gamma_value=0.05,
        gamma_every_n=None,
        t_init_cycles=15,
        phase2_cycles=15,
        pc_lr=0.0001,
        batch_size=256,
        epochs=200,
        use_adamw=True,
        adamw_weight_decay=0.01,
        adamw_betas=(0.9, 0.999),
        adamw_eps=1e-08,
        clip_grad_norm=1.0,
        seed=3,
        run_name="mnist_1024_512h",
        use_fashion_mnist=False,
        dropout_rate=0.5,
        v1_dropout=False,
        random_crop_padding=2,
        normalize=True,
        fmnist_hflip_p=0.0,
        device="cuda:0" # Adjust device ID if necessary
    )
    main(cfg)

----------------------------------------------------------------------
3. Fashion-MNIST with a 784-400-10 Network
----------------------------------------------------------------------
This configuration trains on the Fashion-MNIST dataset. It uses a higher 
gamma_value and no data normalization or random cropping.

Expected Test Accuracy: ~89.25%

To run, use this block:
------------------------
if __name__ == "__main__":
    cfg = DiffPCConfig(
        layer_dims=[784, 400, 10],
        lt_m=0,
        lt_n=8,
        lt_a=1.0,
        lt_scheduler_type="cyclic_phase",
        gamma_value=0.2,
        gamma_every_n=None,
        t_init_cycles=15,
        phase2_cycles=15,
        pc_lr=0.0001,
        batch_size=256,
        epochs=200,
        use_adamw=True,
        adamw_weight_decay=0.01,
        adamw_betas=(0.9, 0.999),
        adamw_eps=1e-08,
        clip_grad_norm=1.0,
        seed=1,
        run_name="fmnist_400h",
        use_fashion_mnist=True,
        dropout_rate=0.5,
        v1_dropout=False,
        random_crop_padding=0,
        normalize=False,
        fmnist_hflip_p=0.0,
        device="cuda:0" # Adjust device ID if necessary
    )
    main(cfg)

----------------------------------------------------------------------
4. Fashion-MNIST with a 784-1000-10 Network and Augmentation
----------------------------------------------------------------------
This configuration uses a larger hidden layer and introduces horizontal 
flipping as data augmentation for Fashion-MNIST.

Expected Test Accuracy: ~89.68%

To run, use this block:
------------------------
if __name__ == "__main__":
    cfg = DiffPCConfig(
        layer_dims=[784, 1000, 10],
        lt_m=0,
        lt_n=8,
        lt_a=1.0,
        lt_scheduler_type="cyclic_phase",
        gamma_value=0.2,
        gamma_every_n=None,
        t_init_cycles=15,
        phase2_cycles=15,
        pc_lr=0.0001,
        batch_size=256,
        epochs=200,
        use_adamw=True,
        adamw_weight_decay=0.01,
        adamw_betas=(0.9, 0.999),
        adamw_eps=1e-08,
        clip_grad_norm=1.0,
        seed=1,
        run_name="fmnist_1000h_augment",
        use_fashion_mnist=True,
        dropout_rate=0.5,
        v1_dropout=False,
        random_crop_padding=0,
        normalize=False,
        fmnist_hflip_p=0.5,
        device="cuda:0" # Adjust device ID if necessary
    )
    main(cfg)
"""