import numpy as np
import os
import datetime
import collections
from os.path import dirname, abspath
from copy import deepcopy
from sacred import Experiment, SETTINGS
from sacred.observers import FileStorageObserver
from sacred.utils import apply_backspaces_and_linefeeds
import sys
import torch as th
from utils.logging import get_logger
import yaml
import swanlab
# Environment variables are assigned here, ahead of the project imports that follow.
# NOTE(review): each assignment overwrites any value inherited from the shell;
# the empty strings look like placeholders to be filled in locally — confirm.
os.environ["WANDB_API_KEY"] = ""
os.environ["SWANLAB_API_KEY"] = ""
os.environ["SC2PATH"] = ""
os.environ['SUPPRESS_GR_PROMPT'] = '1'
# import run program
from run import run as run
from collect_data import run as collect_data
from offline_run import run as offline_run
from offline_meta_run import run as offline_meta_run
from offline_continuous_run import run as offline_cont_run
from offline_role_prior_run import run as offline_role_prior_run

from swanlab import Settings

# Create a new settings object and merge it into swanlab's settings.
new_settings = Settings(
    log_proxy_type="stdout",
)
swanlab.merge_settings(new_settings)

SETTINGS['CAPTURE_MODE'] = "fd" # set to "no" if you want to see stdout/stderr in console
logger = get_logger()

# Sacred experiment object; it uses the project logger and filters captured
# output through apply_backspaces_and_linefeeds.
ex = Experiment("OfflineMARL", save_git_info=False)
ex.logger = logger
ex.captured_out_filter = apply_backspaces_and_linefeeds

# Root "results" directory, located in the parent of the directory that contains this file.
results_path = os.path.join(dirname(dirname(abspath(__file__))), "results")


@ex.main
def my_main(_run, _config, _log):
    # Setting the random seed throughout the modules
    config = config_copy(_config)
    np.random.seed(config["seed"])
    th.manual_seed(config["seed"])
    config['env_args']['seed'] = config["seed"]

    # run the framework
    match config['run_file']:
        case 'online':
            run(_run, config, _log)
        case "collect":
            collect_data(_run, config, _log)
        case "offline_role_prior":
            offline_role_prior_run(_run, config, _log)
        case "offline":
            if config["env"] == "mujoco":
                offline_cont_run(_run, config, _log)
            else:
                offline_run(_run, config, _log)
        case "offline_meta":
            offline_meta_run(_run, config, _log)
        case _: 
            raise NotImplementedError("hhhh")
    
    swanlab.finish()


def _get_config(params, arg_name, subfolder):
    config_name = None
    for _i, _v in enumerate(params):
        if _v.split("=")[0] == arg_name:
            config_name = _v.split("=")[1]
            del params[_i]
            break
    
    if config_name is not None:
        with open(os.path.join(os.path.dirname(__file__), "config", subfolder, "{}.yaml".format(config_name)), "r") as f:
            try:
                config_dict = yaml.safe_load(f)
            except yaml.YAMLError as exc:
                assert False, "{}.yaml error: {}".format(config_name, exc)

        return config_dict
    else: # e.g. collect_data but not assign task config
        return {}

def _get_run_file(params):
    # --run/--collect/--
    run_file = ''
    for _i, _v in enumerate(params):
        if _v.startswith('--') and '=' not in _v:
            run_file = _v[2:]
            del params[_i]
            return run_file
    return run_file

def recursive_dict_update(d, u):
    """Merge mapping ``u`` into ``d`` in place, recursing into nested mappings.

    Args:
        d: Destination dict; it is modified and returned.
        u: Mapping whose entries override those of ``d``.

    Returns:
        ``d`` after the merge. Where both sides hold a mapping under the same
        key the two are merged key by key; otherwise the value from ``u``
        wins. A non-mapping value in ``d`` (for instance ``None``) is replaced
        by a fresh dict built from the mapping in ``u``.
    """
    # Imported locally so the function does not depend on `collections.abc`
    # being reachable as an attribute of a bare `import collections`.
    from collections.abc import Mapping

    for k, v in u.items():
        if isinstance(v, Mapping):
            existing = d.get(k)
            # Only an existing mapping can be merged into; anything else is
            # overridden by the incoming mapping.
            if not isinstance(existing, Mapping):
                existing = {}
            d[k] = recursive_dict_update(existing, v)
        else:
            d[k] = v
    return d

def config_copy(config):
    """Return a recursive copy of a nested dict/list configuration.

    Dicts and lists are rebuilt element by element as plain ``dict`` and
    ``list`` objects; every other value is duplicated with ``deepcopy``.
    """
    if isinstance(config, list):
        return list(map(config_copy, config))
    if not isinstance(config, dict):
        return deepcopy(config)

    duplicate = {}
    for key, value in config.items():
        duplicate[key] = config_copy(value)
    return duplicate

# get config from argv, such as "remark"
def _get_argv_config(params):
    config = {}
    to_del = []
    for _i, _v in enumerate(params):
        item = _v.split("=")[0]
        if item[:2] == "--" and item not in ["envs", "algs"]:
            config_v = _v.split("=")[1]
            try:
                config_v = eval(config_v)
            except:
                pass
            config[item[2:]] = config_v
            to_del.append(_v)
    for _v in to_del:
        params.remove(_v)
    return config

if __name__ == '__main__':
    params = deepcopy(sys.argv)

    # Get the defaults from default.yaml
    with open(os.path.join(os.path.dirname(__file__), "config", "default.yaml"), "r") as f:
        try:
            config_dict = yaml.safe_load(f)
        except yaml.YAMLError as exc:
            assert False, "default.yaml error: {}".format(exc)

    # read the run file
    run_file = _get_run_file(params)
    config_dict['run_file'] = run_file

    # Load algorithm base configs
    alg_config = _get_config(params, "--config", "algs")
    # config_dict = {**config_dict, **alg_config}
    config_dict = recursive_dict_update(config_dict, alg_config)

    # get env type and load env config
    env_config = _get_config(params, "--env-config", "envs")
    config_dict = recursive_dict_update(config_dict, env_config)

    
    config_dict = recursive_dict_update(config_dict, _get_argv_config(params))
    
    ### TODO: adding MuJoCo
    # test match in python 3.10.x
    match config_dict["env"]:
        case "sc2":
            # overwrite map_name config
            if "map_name" in config_dict:
                config_dict["env_args"]["map_name"] = config_dict["map_name"]
        case "sc2_v2":
            # overwrite map_name config
            if "task" in config_dict:
                config_dict["env_args"]["task"] = config_dict["task"]
                if "terran" in config_dict["task"]:
                    config_dict["env_args"]["map_name"] = "10gen_terran"
                elif "protoss" in config_dict["task"]:
                    config_dict["env_args"]["map_name"] = "10gen_protoss"
                elif "zerg" in config_dict["task"]:
                    config_dict["env_args"]["map_name"] = "10gen_zerg"
                else:
                    assert False
        case "gymma":
            if "key" in config_dict:
                config_dict["env_args"]["key"] = config_dict["key"]
            if "time_limit" in config_dict:
                config_dict["env_args"]["time_limit"] = config_dict["time_limit"]
            if "pretrained_wrapper" in config_dict:
                config_dict["env_args"]["pretrained_wrapper"] = config_dict["pretrained_wrapper"]
        case "mt_grid_mpe":
            if "task_id" in config_dict:
                config_dict["env_args"]["task_id"] = config_dict["task_id"]
        case "mujoco":
            if "scenario" in config_dict:
                config_dict["env_args"]["scenario"] = config_dict["scenario"]
            if "agent_conf" in config_dict:
                config_dict["env_args"]["agent_conf"] = config_dict["agent_conf"]
        case _:
            raise NotImplementedError("Not support env: {}".format(config_dict["env"]))
        
    # get result path
    if 'remark' in config_dict:
        config_dict['remark'] = '_' + config_dict['remark']
    else:
        config_dict['remark'] = ''

    # result_dir_format: {run_file}/{Y_M_D}/.../{remark}/{seed}_{HMS}
    Y_M_D, H_M_S = datetime.datetime.now().strftime("%Y_%m_%d %H_%M_%S").split()
    unique_token = "seed_{}_{}".format(config_dict['seed'], H_M_S)

    config_dict['unique_token'] = unique_token

    match config_dict["env"]:
        case "sc2":
            env, map_name = config_dict["env"], config_dict["env_args"]["map_name"]
            if "total_task_ls" in config_dict.keys():
                if "12m" in config_dict["total_task_ls"]:
                    env = env + "_marine_easy"
                elif "13m_vs_15m" in config_dict["total_task_ls"]:
                    env = env + "_marine_hard"
                elif "2s3z" in config_dict["total_task_ls"]:
                    env = env + "_stalker_zealot"
        case "sc2_v2":
            env, map_name, task_name = config_dict["env"], config_dict["env_args"]["map_name"], config_dict["env_args"]["task"]
            if "total_task_ls" in config_dict.keys():
                if "terran_5_vs_5_meta1" in config_dict["total_task_ls"]:
                    env = env + "_terran"
                elif "protoss_5_vs_5_meta1" in config_dict["total_task_ls"]:
                    env = env + "_protoss"
                elif "zerg_5_vs_5_meta1" in config_dict["total_task_ls"]:
                    env = env + "_zerg"
                else:
                    env = env
                if "without_unit_type" in config_dict.keys():
                    env = env + "_wo_unit_type"
        case "gymma":
            env, map_name = config_dict["env_args"]["key"].split(':')
        case "mt_grid_mpe":
            env, map_name = config_dict["env"], str(config_dict["env_args"]["task_id"])
            if config_dict["num_tasks"]==4:
                env = env+"_agent"
        case "mujoco":
            env, map_name = config_dict["env"], config_dict["env_args"]["scenario"]+"-"+config_dict["env_args"]["agent_conf"]
            config_dict["env_args"]["map_name"] = map_name
        case _:
            raise NotImplementedError("Not support env: {}".format(config_dict["env"]))
    
    match config_dict['run_file']:
        case 'offline':
            if config_dict['evaluate']:
                results_path = os.path.join(results_path, 'evaluate')
            
            name = "offline"
            name_remark = config_dict['name'] + config_dict['remark']
            if config_dict["is_diffusion"]:
                if config_dict["use_rnn"]:
                    name_remark += "_rnn"
            if config_dict['use_obs_attack']:
                name += "_robust"
                results_save_dir = os.path.join(
                    results_path, name, Y_M_D, env, map_name, f"noise_scale_{config_dict['noise_scale']}",
                    config_dict['offline_data_quality'],
                    name_remark,
                    unique_token
                )
            else:
                results_save_dir = os.path.join(
                    results_path, "offline", Y_M_D, env, map_name,
                    config_dict['offline_data_quality'],
                    name_remark,
                    unique_token
                )
        case 'offline_role_prior':
            if config_dict['evaluate']:
                results_path = os.path.join(results_path, 'evaluate')
            
            name = "offline_role_prior"
            name_remark = config_dict['name'] + config_dict['remark']
            results_save_dir = os.path.join(
                results_path, "offline_role_prior", Y_M_D, env, task_name,
                config_dict['offline_data_quality'],
                name_remark,
                unique_token
            )
        case 'offline_meta':
            if config_dict['evaluate']:
                results_path = os.path.join(results_path, 'evaluate')
            
            name = "offline_meta"
            if config_dict.get("is_vae_train", False):
                if config_dict.get("is_vqvae", False):
                    name += "_vqvae"
                else:
                    name += "_vae"
                results_save_dir = os.path.join(
                    results_path, name, Y_M_D, env, map_name, f"vae_beta_{config_dict['vae_beta']}",
                    config_dict['offline_data_quality'],
                    config_dict['name'] + config_dict['remark'],
                    unique_token
                )
            elif config_dict.get("is_prior_role_encoder_train", False):
                name += "_prior_role_encoder"
                if config_dict.get("weighted_prior_learning", False):
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, map_name, f"encoder_{config_dict['encoder_id']}", f"role_encoder_{config_dict['role_encoder_id']}",
                        "weighted_prior",
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )
                else:
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, map_name, f"encoder_{config_dict['encoder_id']}", f"role_encoder_{config_dict['role_encoder_id']}",
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )
            elif config_dict.get("is_role_encoder_train", False):
                if config_dict["use_decoder_loss"]:
                    decoder_str = "1"
                else:
                    decoder_str = "0"
                
                name += "_role_encoder"
                if not config_dict.get("role_use_task_encoding", True):
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, map_name, f"encoder_{config_dict['encoder_id']}", "use_decoder_loss", decoder_str,
                        f"info_nce_temp_{config_dict['infonce_temp']}",
                        "wo_task_encoding",
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )
                else:
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, map_name, f"encoder_{config_dict['encoder_id']}", "use_decoder_loss", decoder_str,
                        f"info_nce_temp_{config_dict['infonce_temp']}",
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )
            elif config_dict.get("is_encoder_train", False):
                if config_dict["use_decoder_loss"]:
                    decoder_str = "1"
                else:
                    decoder_str = "0"
                
                if config_dict["use_mg2l"]:
                    mg2l_str = "1"
                else:
                    mg2l_str = "0"
                
                if config_dict["use_club"]:
                    club_str = "1"
                else:
                    club_str = "0"
                name += "_encoder"
                results_save_dir = os.path.join(
                    results_path, name, Y_M_D, env, map_name, config_dict['cl_loss'], "use_decoder_loss", decoder_str, "use_mg2l", mg2l_str, "use_club", club_str,
                    config_dict['offline_data_quality'],
                    config_dict['name'] + config_dict['remark'],
                    unique_token
                )
            else:
                if config_dict.get("is_meta_adaptation", False):
                    name += "_adaptation"
                    
                if config_dict['name'] == "meta_omiga_diffusion":
                    if config_dict["simple_mlp_agent"]:
                        config_dict['name'] = "meta_omiga_latent_cvae"
                    config_dict['name'] = config_dict['name'] + "_vae" + str(config_dict["vae_id"])

                if config_dict.get("use_role_encoder", False):
                    role_encoder_str = "1"
                else:
                    role_encoder_str = "0"

                config_dict["encoder_path"] = config_dict["encoder_path_ls"][config_dict["encoder_id"]]
                tmp_name = ""
                
                if not config_dict.get("is_meta_adaptation", False):
                    if config_dict.get("perturb_local_encoding", False):
                        tmp_name += f"perturb_task_encoding_scale_{config_dict['perturb_noise_scale']}"
                    if config_dict.get("only_role_encoding", False):
                        if tmp_name == "":
                            tmp_name += "only_role_encoding"
                        else:
                            tmp_name += "/only_role_encoding"

                    if config_dict.get("separate_role_encoding", False):
                        if config_dict["use_moe"]:
                            if tmp_name == "":
                                tmp_name += "separate_role_encoding_moe"
                            else:
                                tmp_name += "/separate_role_encoding_moe"
                        else:
                            if tmp_name == "":
                                tmp_name += "separate_role_encoding"
                            else:
                                tmp_name += "/separate_role_encoding"
                    if tmp_name == "":
                        tmp_name = "perturb_task_encoding_False"
                else:
                    if config_dict.get("use_idaq", False):
                        tmp_name = "idaq"
                    else:
                        tmp_name = "encoding_mean"
                    
                    if config_dict.get("collect_with_idaq", False):
                        tmp_name += "/collect_with_idaq"
                    
                    if config_dict.get("collect_with_best_role", False):
                        tmp_name += "/collect_with_best_role_after_"+str(config_dict["prior_role_collect_episode"])
                    
                    tmp_name += f"/policy_{config_dict['policy_id']}"

                if config_dict.get('train_with_prior_encoding_p', False):
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, "use_role_encoder", role_encoder_str,"encoder_"+str(config_dict["encoder_id"]), "role_encoder_"+str(config_dict["role_encoder_id"]), "prior_role_encoder_"+str(config_dict["prior_role_encoder_id"]),
                        tmp_name,
                        f"train_prior_p_{config_dict['train_with_prior_encoding_p']}",
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )
                else:
                    results_save_dir = os.path.join(
                        results_path, name, Y_M_D, env, "use_role_encoder", role_encoder_str,"encoder_"+str(config_dict["encoder_id"]), "role_encoder_"+str(config_dict["role_encoder_id"]), "prior_role_encoder_"+str(config_dict["prior_role_encoder_id"]),
                        tmp_name,
                        config_dict['offline_data_quality'],
                        config_dict['name'] + config_dict['remark'],
                        unique_token
                    )

        case "collect":
            if (env == "sc2" or env == "sc2_v2") and config_dict["stop_winrate"] > 0:    
                aux_dir = f"stop_win_rate_{config_dict['stop_winrate']}"
            else:
                aux_dir = f"stop_return_{config_dict['stop_return']}"
            results_save_dir = os.path.join(
                results_path, "collect", Y_M_D,
                env + os.sep + task_name,
                config_dict['offline_data_quality'], aux_dir,
                config_dict['name'] + config_dict['remark'],
                unique_token
            )
        case "online":
            if config_dict['evaluate']:
                results_path = os.path.join(results_path, 'evaluate')
            results_save_dir = os.path.join(
                results_path, "run_online", Y_M_D,
                env + os.sep + map_name, 
                config_dict['name'] + config_dict['remark'],
                unique_token
            )
        case _:
            raise NotImplementedError("Not support run_file: {}".format(config_dict['run_file']))
                                  
    os.makedirs(results_save_dir, exist_ok=True)
    config_dict['results_save_dir'] = results_save_dir
    #config_dict['pretrain_save_dir'] = os.path.join(dirname(results_save_dir), 'pretrain-models')

    # Save to disk by default for sacred
    file_obs_path = os.path.join(results_save_dir, "sacred")
    ex.observers.append(FileStorageObserver.create(file_obs_path))
    logger.info("Saving to FileStorageObserver in {}.".format(file_obs_path))
    # now add all the config to sacredd
    ex.add_config(config_dict)
    ex.run_commandline(params)
