from joblib import Parallel, delayed
from itertools import product
import subprocess
import multiprocessing
import os
# Set at import time, before any job is launched: child processes started via
# subprocess inherit this process's environment by default, so every launched
# command sees the variable as well.
# NOTE(review): presumably a workaround for an MKL threading-layer conflict in
# the training jobs — confirm it is still required.
os.environ["MKL_SERVICE_FORCE_INTEL"] = "1"

def run_command(command):
    """
    Run a single command through the shell and report failures.

    Args:
        command: The complete command line as one string; it is handed to
            the shell unchanged.

    Returns:
        The exit status of the command (0 means success). Callers that do
        not care about the status can ignore the return value.
    """
    import sys  # local import: only needed for the failure report below

    # shell=True is kept because the command arrives as one pre-assembled string.
    completed = subprocess.run(command, shell=True)
    if completed.returncode != 0:
        # Make failed runs visible instead of letting them pass silently.
        print(
            f"Command failed with exit code {completed.returncode}: {command}",
            file=sys.stderr,
        )
    return completed.returncode
    
def generate_commands(base_command, params):
    """
    Expand a parameter grid into one command string per combination.

    Args:
        base_command: Command prefix shared by every generated command.
        params: Mapping from option name to an iterable of candidate values.

    Returns:
        A list with one entry per element of the Cartesian product of the
        value lists; each entry is ``base_command`` followed by
        `` name=value`` for every option, in the mapping's key order.
        An empty mapping yields ``[base_command]``.
    """
    names = tuple(params)
    return [
        base_command + "".join(f" {name}={choice}" for name, choice in zip(names, combo))
        for combo in product(*params.values())
    ]

def create_all_commands():
    """
    Build the command lines for the neuro_sync ablation runs.

    Every enabled config override is combined with every seed, and each
    pair is turned into one ``python main_sl.py ...`` invocation.

    Returns:
        A list of command strings, grouped by override in list order and,
        within each group, ordered by seed.
    """
    # TODO Should we use SWEEP if we don't want hyper-parameter tuning?
    # SWEEP='sweep=TRAIN'

    shared_args = 'arch=mlp proj_name=ablation_train wandb=true task=shuffle_cifar10 monitor_forward_transfer=false monitor_backward_transfer=false'
    launcher = f'python main_sl.py {shared_args}'

    seed_count = 1

    # Uncomment an entry to include that override in the sweep.
    overrides = [
        # 'agent.WC=false',
        # 'agent.SM=false',
        # 'agent.AL=false',
        'agent.ARM=false',
        # 'agent.SM_detach=true'
    ]

    # The seed grid is the same for every override, so build it once.
    seed_grid = {'seed': list(map(str, range(seed_count)))}

    all_commands = []
    for override in overrides:
        # Batch 11- NeuroSync
        prefix = f'{launcher} agent=neuro_sync {override}'
        all_commands.extend(generate_commands(prefix, seed_grid))

    return all_commands

if __name__ == "__main__":
    # Assemble the whole job list first so its size can be reported.
    job_list = create_all_commands()
    # print("Commands", job_list)
    print("Num commands", len(job_list))

    # Worker count: on machines with four or more cores use only half of
    # them; smaller machines use every core.
    detected_cores = multiprocessing.cpu_count()
    worker_count = detected_cores // 2 if detected_cores >= 4 else detected_cores

    # Fan the commands out over joblib workers, one task per command.
    tasks = (delayed(run_command)(job) for job in job_list)
    Parallel(n_jobs=worker_count)(tasks)