import argparse
import datetime
import itertools
import os
import pathlib
import subprocess
import textwrap

parser = argparse.ArgumentParser()
parser.add_argument(
    "--root_dir",
    type=str,
    required=False,
    default="Path to deterministic base checkpoint",
)
parser.add_argument("--experiment-name", type=str, required=False, default="poseidon")
parser.add_argument("--local", action="store_true")
parser.add_argument("--single-run", action="store_true")
parser.add_argument(
    "--dataset",
    type=str,
    choices=[
        "euler",
        "RB",
        "shear_flow",
    ],
    required=True,
)
args = parser.parse_args()

validation_frequency = 30
if args.dataset == "RB":
    data_name = "rayleigh_benard"
    data_short = "RB"
    num_channels = 4
    max_num_samples_dataset = 10
    sweep_data = [
        {
            "name": "rayleigh_benard",
            "n_steps_input": 6,
            "n_steps_output": 1,
            "max_rollout_steps": 200,
            "image_size": [128, 128],
        },
    ]
    checkpoint_name = "step_200"
    trainer = "defaults_mean"
    num_samples = 4
    if num_samples > 2:
        batch_size = 16
        grad_acc = 1
        max_samples = 500
    elif num_samples == 2:
        batch_size = 32
        grad_acc = 1
        max_samples = 250
elif args.dataset == "euler":
    data_name = "euler_multi_quadrants_periodicBC"
    data_short = "euler"
    num_channels = 5
    max_num_samples_dataset = 6
    sweep_data = [
        {
            "name": "euler_multi_quadrants_periodicBC",
            "n_steps_input": 6,
            "n_steps_output": 1,
            "max_rollout_steps": 100,
            "image_size": [128, 128],
            "prefetch_factor": 2,
            "persistent_workers": True,
        },
    ]
    validation_frequency = 30
    image_size = [128, 128]
    trainer = "defaults_mean"
    num_samples = 4
    if num_samples > 2:
        batch_size = 16
        grad_acc = 1
        max_samples = 500
    elif num_samples == 2:
        batch_size = 32
        grad_acc = 1
        max_samples = 250
elif args.dataset == "shear_flow":
    data_name = "shear_flow"
    data_short = "shear"
    num_channels = 4
    max_num_samples_dataset = 10
    num_samples = 4
    image_size = [128, 128]
    trainer = "defaults_mean"
    if num_samples > 2:
        batch_size = 16
        grad_acc = 1
        max_samples = 500
    elif num_samples == 2:
        batch_size = 32
        grad_acc = 1
        max_samples = 250

    sweep_data = [
        {
            "name": "shear_flow",
            "n_steps_input": 6,
            "n_steps_output": 1,
            "max_rollout_steps": 200,
            "image_size": image_size,
        },
    ]

init_epoch = checkpoint_name.split("_")[-1]
coalesced_checkpoint_path = (
    f"{args.root_dir}/checkpoints/{checkpoint_name}/coalesced.pth"
)
config_override = f"{args.root_dir}/extended_config.yaml"

sweep = {
    "model_name": ["inv_poseidon_L_with_noise"],
    "lr_scheduler": ["inv_sqrt_w_sqrt_ramps"],
    "optimizer": ["adam"],
    "optimizer_lr": [0.0001],
    "common_optimizer_lr": [0.00005],
    "max_samples": [max_samples],
    "loss_multiplier": [1],
    "max_epoch": [100],
    "batch_size": [batch_size],
    "grad_acc_steps": [grad_acc],
    "resize": [True],
    "data": sweep_data,
    "distribution": ["local"],
    "coalesced_checkpoint_path": [coalesced_checkpoint_path],
    "config_override": [config_override],
    "num_samples": [num_samples],
    "noise_dim": [32],
    "mlp_layers": [2],
    "idx_noise_layers": [[0, 1, 2, 3]],
    # Trainer
    "validation_ensemble_size": [16],
    "ensemble_sizes_to_save": ["[1, 2, 4, 8, 16]"],
    "max_num_samples": [max_num_samples_dataset],
    "weight_decay": [0.0001],
    "poseidon_one_sample_norm": [True],
}

# Step 2: Create combinations of all params
keys, values = zip(*sweep.items())
combinations = [dict(zip(keys, combo)) for combo in itertools.product(*values)]

experiment_name = f"_{data_short}"
date_string = datetime.datetime.now().strftime("%d-%m_%H-%M-%S")

username = os.environ["USER"]
slurm_folder = f"/mnt/home/{username}/crps_retrofitting/slurm_outputs/poseidon"
os.makedirs(slurm_folder, exist_ok=True)
current_path = pathlib.Path.cwd()
# Step 3: Generate, submit, and delete sbatch scripts
for i, params in enumerate(combinations):
    warmup_epochs = min(int(0.1 * params["max_epoch"]), 10)
    cooldown_epochs = min(int(0.1 * params["max_epoch"]), 10)
    job_name = f"{params['data']['name']}_job_{i}"
    script_filename = f"{job_name}.sbatch"

    num_injection_layers = len(params["idx_noise_layers"])

    ablate_string = f"{params['max_epoch']}_NS{num_samples}_{params['poseidon_one_sample_norm']}_L{num_injection_layers}_WD{params['weight_decay']}_ckpt{init_epoch}_{params['optimizer_lr']}_{params['common_optimizer_lr']}"

    # Build the python command string
    python_cmd = textwrap.dedent(
        f"""\
        python crps_retrofitting/train.py \
        distribution=local \
        finetune=True \
        frozen_components=[] \
        trainer={trainer} \
        trainer.enable_amp=False \
        trainer.loss_fn._target_=crps_retrofitting.metrics.crps.CRPS \
        ++trainer.ensemble_sizes_to_save='{params['ensemble_sizes_to_save']}' \
        ++trainer.validation_ensemble_size={params['validation_ensemble_size']} \
        ++trainer.max_num_samples={params['max_num_samples']} \
        ++trainer.max_spectral_val_samples=5 \
        ++trainer.poseidon_one_sample_norm={params['poseidon_one_sample_norm']} \
        data={params['data']['name']} \
        model={params['model_name']} \
        model.resize={params['resize']} \
        model.num_channels={num_channels} \
        model.num_out_channels={num_channels} \
        ++model.image_size='{params['data']['image_size']}' \
        model.num_samples={params['num_samples']} \
        model.noise_dim={params['noise_dim']} \
        ++model.idx_noise_layers='{params['idx_noise_layers']}' \
        model.mlp_layers={params['mlp_layers']} \
        trainer.grad_acc_steps={params['grad_acc_steps']} \
        data_workers=10 \
        logger.wandb=True \
        auto_resume=False \
        trainer.max_epoch={params['max_epoch']} \
        optimizer={params['optimizer']} \
        optimizer.lr={params['optimizer_lr']} \
        lr_scheduler={params['lr_scheduler']} \
        lr_scheduler.warmup_epochs={warmup_epochs} \
        lr_scheduler.cooldown_epochs={cooldown_epochs} \
        trainer.loss_multiplier={params['loss_multiplier']} \
        name={experiment_name}_{ablate_string} \
        auto_resume=False \
        trainer.prediction_type="full" \
        ++data.image_size="{params['data']['image_size']}" \
        data.module_parameters.batch_size={params['batch_size']} \
        data.module_parameters.max_samples={params['max_samples']} \
        data.module_parameters.n_steps_input={params['data']['n_steps_input']} \
        data.module_parameters.n_steps_output={params['data']['n_steps_output']} \
        data.module_parameters.inner_dset_type._target_=crps_retrofitting.data.inflated_dataset.BatchWellDataset \
        trainer.max_rollout_steps={params['data']['max_rollout_steps']} \
        ++trainer.reuse_batches=True \
        trainer.val_frequency={validation_frequency} \
        trainer.rollout_val_frequency={validation_frequency} \
        checkpoint.coalesced_checkpoint_path='{params['coalesced_checkpoint_path']}' \
        config_override='{params['config_override']}' \
        ++optimizer.new_params_lr={params['optimizer_lr']} \
        ++optimizer.common_params_lr={params['common_optimizer_lr']} \
        ++optimizer.new_params_kwargs.weight_decay={params['weight_decay']} \
        ++optimizer.new_params_kwargs.eps=1e-10 \
        ++optimizer.common_params_kwargs.weight_decay=0.0001 \
        ++optimizer.common_params_kwargs.eps=1e-10 \
        """
    )

    script_content = textwrap.dedent(
        f"""\
        #!/bin/bash
        #SBATCH --time=7-00:00:00
        #SBATCH --partition=gpu
        #SBATCH --nodes=1
        #SBATCH --gres=gpu:1
        #SBATCH -C h100
        #SBATCH --ntasks-per-node=1
        #SBATCH --gpus-per-node=1
        #SBATCH --cpus-per-gpu=16
        #SBATCH --job-name={job_name}
        #SBATCH --output={slurm_folder}/{params['data']['name']}/{experiment_name}/%j_{job_name}_{date_string}.log

        export OMP_NUM_THREADS=${{SLURM_CPUS_ON_NODE}}
        export HDF5_USE_FILE_LOCKING=FALSE
        export HYDRA_FULL_ERROR=1
        export NCCL_DEBUG=WARN
        export LD_LIBRARY_PATH=""
        module load ffmpeg
        source ./venvs/walrus/bin/activate

        {python_cmd}
        """
    )

    with open(script_filename, "w") as f:
        f.write(script_content)

    if args.local:
        subprocess.run(["bash", script_filename])
    else:
        subprocess.run(["sbatch", script_filename])

    os.remove(script_filename)

    if args.single_run:
        break
