'''
Experiment 06: sweep `aux_route_prc` over a single routed MoE stage.

Launch with:
export OMP_NUM_THREADS=16 && torchrun --nproc_per_node=8 -m src.run.orchestrate.experiment.exp_06_hyperparam_realistic
'''

from src.run.orchestrate.config import RealisticBaseArgs, calc_realistic_model_params
from src.run.utils import get_timestamp
from src.run.main import run

from pathlib import Path
from copy import deepcopy

if __name__ == '__main__':
    # Script entry point: build one run configuration per `aux_route_prc`
    # value, then execute the runs one after another via `run`.

    # Values swept for the stage's "aux_route_prc" setting.
    sweep_values = [0.0, 0.25, 0.5, 0.75, 1.0]
    # "robust_prc" is held constant for every run in the sweep.
    fixed_robust_prc = 0.05
    checkpoint_enabled = False

    # All runs of this invocation write beneath one timestamped directory.
    # NOTE(review): under torchrun every process evaluates get_timestamp()
    # itself; confirm the value is identical across ranks (or that only one
    # rank writes results), otherwise output directories may diverge.
    src_root = Path("src").absolute()
    output_root = src_root / f"results/realistic/06/combined_{get_timestamp()}"

    # Template for the single stage; "aux_route_prc" is overwritten per run.
    routed_stage = {
        "name": "routed",
        "arch": "moe",
        "ordered": False,
        "ft_forget": False,
        "aux_route_prc": 0.75,
        "robust_prc": fixed_robust_prc,
        "expert_dist": "prc_one",
        "do_checkpoint": checkpoint_enabled,
    }

    # Work on a private copy so the shared RealisticBaseArgs is never mutated.
    shared_args = deepcopy(RealisticBaseArgs)
    shared_args['aux_labels'] = ["bigcode", "biology", "nuclear", "cyber"]
    shared_args['stages'] = [routed_stage]
    # Presumably 700e6 is the target parameter count -- verify against
    # calc_realistic_model_params.
    shared_args.update(calc_realistic_model_params(700e6))
    shared_args['seed'] = 42

    def _variant_for(route_prc):
        # Independent deep copy of the shared arguments with the first
        # stage's routing and robustness percentages set for this run.
        variant = deepcopy(shared_args)
        first_stage = variant["stages"][0]
        first_stage["aux_route_prc"] = route_prc
        first_stage["robust_prc"] = fixed_robust_prc
        return variant

    # Materialise every configuration before starting any run.
    sweep_configs = [_variant_for(route_prc) for route_prc in sweep_values]

    final_index = len(sweep_configs) - 1
    for position, run_kwargs in enumerate(sweep_configs):
        # Each run gets its own timestamped sub-directory of output_root.
        stamp = get_timestamp()
        run_kwargs['timestamp'] = stamp
        run_kwargs['res_dir'] = output_root / f"results_{stamp}"
        # Only the last run is flagged to clean up the distributed state.
        run_kwargs['do_cleanup_distributed'] = (position == final_index)
        run(**run_kwargs)