'''
export OMP_NUM_THREADS=16 && torchrun --nproc_per_node=8 -m src.run.orchestrate.experiment.exp_02_realistic
'''

from src.run.orchestrate.config import RealisticBaseArgs, calc_realistic_model_params
from src.run.utils import get_timestamp
from src.run.main import run

from pathlib import Path
from copy import deepcopy

if __name__ == '__main__':
    # Driver for experiment 02 (realistic setting): builds one config per seed
    # from RealisticBaseArgs and executes them one after another via run().

    NUM_RUNS = 3

    # All runs of this invocation write below a single timestamped directory
    # under ./src (resolved against the current working directory).
    # NOTE(review): when launched through torchrun every process evaluates
    # get_timestamp() on its own; presumably the ranks end up with the same
    # value -- confirm against get_timestamp()'s resolution.
    src_root = Path("src").absolute()
    res_root = src_root / f"results/realistic/02/combined_{get_timestamp()}"
    do_checkpoint = False

    # Work on a private copy so the imported RealisticBaseArgs stays untouched.
    base_args = deepcopy(RealisticBaseArgs)
    base_args['aux_labels'] = ["bigcode", "biology", "nuclear", "cyber"]

    # Only the uncommented stage is executed; the commented-out entries are
    # alternative stage configurations kept for reference.
    base_args['stages'] = [
        # {
        #     "name": "baseline", "ft_forget": True, "do_checkpoint": do_checkpoint,
        # },
        # {
        #    "name": "maxent", "ft_forget": True,
        #    "me_alpha_retain": 100, "me_steps": 400, "me_lr": 5e-5,
        #    "do_checkpoint": False,
        # },
        # {
        #     "name": "coreftaux", "ft_forget": True, "core_prc": 0.8, "aux_prc": 0.5, "do_checkpoint": do_checkpoint,
        # },
        {
            "name": "routed",
            "arch": "lora",
            "ordered": True,
            "ft_forget": True,
            "core_prc": 0.8,
            "aux_prc": 0.5,
            "lora_attn": True,
            "lora_mlp": True,
            "expert_dist": "prc_one",
            "equal_compute": True,
            "do_checkpoint": do_checkpoint,
        },
        # {
        #     "name": "routed", "arch": "moe", "ordered": False, "ft_forget": True,
        #     "aux_route_prc": 0.75, "robust_prc": 0.5, "expert_dist": "prc_one",
        #     "do_checkpoint": do_checkpoint,
        # },
        # {
        #     "name": "filtering", "ft_forget": True, "do_checkpoint": do_checkpoint
        # },
    ]

    # Merge in whatever calc_realistic_model_params returns for the 700e6 argument.
    base_args.update(calc_realistic_model_params(700e6))

    # Phase 1: materialise an independent config for each seed 0..NUM_RUNS-1.
    run_configs = []
    for seed in range(NUM_RUNS):
        cfg = deepcopy(base_args)
        cfg["seed"] = seed
        run_configs.append(cfg)

    # Phase 2: execute sequentially. Each run gets a fresh timestamp taken
    # right before it starts, and only the final run is flagged with
    # do_cleanup_distributed=True.
    final_idx = len(run_configs) - 1
    for idx, cfg in enumerate(run_configs):
        stamp = get_timestamp()
        cfg.update({
            'timestamp': stamp,
            'res_dir': res_root / f"results_{stamp}",
            'do_cleanup_distributed': idx == final_idx,
        })
        run(**cfg)