from optexp import Experiment, exp_runner_cli
from optexp.datasets.barcoded_mnist import MNISTAndBarcode
from optexp.models.cnn import SimpleMNISTCNN
from optexp.optimizers import (
    SGD_M,
    SGD_NM,
    Adam_M,
    Adam_NM,
    NormSGD_M,
    NormSGD_NM,
    Sign_M,
    Sign_NM,
)
from optexp.problems.classification import FullBatchClassification
from optexp.runner.slurm import slurm_config
from optexp.utils import SEEDS_1, SEEDS_3, lr_grid, starting_grid_for

# Epoch count handed to every generated experiment (see `epochs=` below).
EPOCHS = 300
# Group label passed to the experiment generator; shared by all runs
# defined in this file.
group = "SimpleCNN_MNISTBarcoded_FB_normalized_v2"

# Problem definition: a SimpleMNISTCNN model on the MNISTAndBarcode dataset,
# wrapped as a full-batch classification problem.
model = SimpleMNISTCNN()
# NOTE(review): batch_size=20_000 is used together with
# FullBatchClassification -- presumably the chunk size used while
# accumulating over the whole dataset; confirm against optexp.
dataset = MNISTAndBarcode(name="MNIST", batch_size=20_000)
problem = FullBatchClassification(model, dataset)

# Coarse sweep: all eight optimizer variants share one starting grid spanning
# start=-5 .. end=1.
# NOTE(review): start/end are presumably log10 exponents of the learning
# rate -- confirm against optexp.utils.starting_grid_for.
opts_sparse = starting_grid_for(
    [SGD_NM, SGD_M, Adam_NM, Adam_M, Sign_NM, Sign_M, NormSGD_NM, NormSGD_M],
    start=-5,
    end=1,
)

# Refined sweep: each optimizer variant gets its own (start, end) window,
# every one of which lies inside the -5 .. 1 range of the sparse sweep.
# The table order fixes the order of the resulting list: all learning rates
# for one optimizer are emitted before moving on to the next.
opts_dense = [
    make_opt(lr)
    for make_opt, grid_start, grid_end in (
        (SGD_NM, -5, 0),
        (SGD_M, -5, 0),
        (Adam_NM, -4, -1),
        (Adam_M, -4, -1),
        (Sign_NM, -3, -1),
        (Sign_M, -4, -2),
        (NormSGD_NM, -1, 1),
        (NormSGD_M, -1, 1),
    )
    for lr in lr_grid(start=grid_start, end=grid_end, density=1)
]

# Assemble the full run list for this problem: the sparse grid is paired with
# SEEDS_1 and the dense grid with SEEDS_3.
experiments = Experiment.generate_experiments_from_opts_and_seeds(
    problem=problem,
    group=group,
    epochs=EPOCHS,
    opts_and_seeds=[
        (opts_sparse, SEEDS_1),
        (opts_dense, SEEDS_3),
    ],
)

# Slurm resource preset forwarded to the CLI runner below.
# NOTE(review): the name suggests one GPU with a 4-hour limit -- confirm
# against optexp.runner.slurm.slurm_config.
SLURM_CONFIG = slurm_config.DEFAULT_GPU_4H

# Only invoke the experiment CLI when this file is executed as a script, so
# importing the module merely defines `experiments` and the config above.
if __name__ == "__main__":
    exp_runner_cli(experiments, slurm_config=SLURM_CONFIG)
