import os
import yaml
from yacs.config import CfgNode as CN

_C = CN()

# Base config files
_C.BASE = [""]

# -----------------------------------------------------------------------------
# Data settings
# -----------------------------------------------------------------------------
_C.DATA = CN()
# Batch size for a single GPU, could be overwritten by command line argument
_C.DATA.BATCH_SIZE = 32
# Path to dataset, could be overwritten by command line argument
_C.DATA.DATA_PATH = ""
# Dataset name
_C.DATA.DATASET = "livec"
# Aug images
_C.DATA.PATCH_NUM = 25
# Input image size
_C.DATA.IMG_SIZE = 224
# Random crop image size
_C.DATA.CROP_SIZE = (224, 224)
# Use zipped dataset instead of folder dataset
# could be overwritten by command line argument
_C.DATA.ZIP_MODE = False
# Cache Data in Memory, could be overwritten by command line argument
_C.DATA.CACHE_MODE = "part"
# Pin CPU memory in DataLoader for more efficient (sometimes) transfer to GPU.
_C.DATA.PIN_MEMORY = True
# Number of data loading threads
_C.DATA.NUM_WORKERS = 4
# -----------------------------------------------------------------------------
# SET settings
# -----------------------------------------------------------------------------
_C.SET = CN()
# K10K: 10073 LIVEC: 1162
_C.SET.COUNT = 1162
_C.SET.TRAIN_INDEX = None
_C.SET.TEST_INDEX = None
# -----------------------------------------------------------------------------
# Model settings
# -----------------------------------------------------------------------------
_C.MODEL = CN()
# Model type
_C.MODEL.TYPE = "swin"
# Model name
_C.MODEL.NAME = "swin_tiny_patch4_window7_224"
# Pretrained weight from checkpoint, could be imagenet22k pretrained weight
# could be overwritten by command line argument
_C.MODEL.PRETRAINED = ""
# Checkpoint to resume, could be overwritten by command line argument
_C.MODEL.RESUME = ""
# Number of classes, overwritten in data preparation
_C.MODEL.NUM_CLASSES = 1
# Dropout rate
_C.MODEL.DROP_RATE = 0.0
# Drop path rate
_C.MODEL.DROP_PATH_RATE = 0.1

# DeiT III
_C.MODEL.VIT = CN()
_C.MODEL.VIT.PATCH_SIZE = 16
_C.MODEL.VIT.EMBED_DIM = 384
_C.MODEL.VIT.DEPTH = 12
_C.MODEL.VIT.NUM_HEADS = 6
_C.MODEL.VIT.MLP_RATIO = 4
_C.MODEL.VIT.QKV_BIAS = True
_C.MODEL.VIT.PRETRAINED = True
_C.MODEL.VIT.PRETRAINED_MODEL_PATH = ""
_C.MODEL.VIT.CROSS_VALID = False
_C.MODEL.VIT.CROSS_MODEL_PATH = ""

# LNN
_C.MODEL.LNN = CN()
_C.MODEL.LNN.IN_CHANS = 3
_C.MODEL.LNN.EMBED_DIM = 96
_C.MODEL.LNN.DEPTHS = [2, 2, 6, 2]
_C.MODEL.LNN.NUM_HEADS = [3, 6, 12, 24]
_C.MODEL.LNN.WINDOW_SIZE = 7
_C.MODEL.LNN.IMG_SIZE = 224
_C.MODEL.LNN.NUM_CLASSES = 1000
# _C.MODEL.LNN.RETURN_INTERM_LAYERS = True
_C.MODEL.LNN.PRETRAINED = True
_C.MODEL.LNN.PRETRAINED_MODEL_PATH = ""
_C.MODEL.LNN.CROSS_VALID = False
_C.MODEL.LNN.CROSS_MODEL_PATH = ""

# LiquidSwinIQA
_C.MODEL.LIQUIDSWIN_IQA = CN()
_C.MODEL.LIQUIDSWIN_IQA.IMG_SIZE = 224
_C.MODEL.LIQUIDSWIN_IQA.PATCH_SIZE = 4
_C.MODEL.LIQUIDSWIN_IQA.IN_CHANS = 3
_C.MODEL.LIQUIDSWIN_IQA.EMBED_DIM = 96
_C.MODEL.LIQUIDSWIN_IQA.DEPTHS = [2, 2, 6, 2]
_C.MODEL.LIQUIDSWIN_IQA.NUM_HEADS = [3, 6, 12, 24]
_C.MODEL.LIQUIDSWIN_IQA.WINDOW_SIZE = 7
_C.MODEL.LIQUIDSWIN_IQA.MLP_RATIO = 4.0
_C.MODEL.LIQUIDSWIN_IQA.USE_MULTI_SCALE = True
_C.MODEL.LIQUIDSWIN_IQA.DROPOUT = 0.1
_C.MODEL.LIQUIDSWIN_IQA.NUM_REGRESSION_HEADS = 1
_C.MODEL.LIQUIDSWIN_IQA.RETURN_INTERM_LAYERS = True
_C.MODEL.LIQUIDSWIN_IQA.PRETRAINED = True
_C.MODEL.LIQUIDSWIN_IQA.PRETRAINED_MODEL_PATH = ""
_C.MODEL.LIQUIDSWIN_IQA.CROSS_VALID = False
_C.MODEL.LIQUIDSWIN_IQA.CROSS_MODEL_PATH = ""

# Hor
_C.MODEL.HOR = CN()
_C.MODEL.HOR.PRETRAINED = True
_C.MODEL.HOR.PRETRAINED_MODEL_PATH = ""

# COC
_C.MODEL.COC = CN()
_C.MODEL.COC.PRETRAINED = True
_C.MODEL.COC.PRETRAINED_MODEL_PATH = ""
_C.MODEL.COC.CROSS_VALID = False
_C.MODEL.COC.CROSS_MODEL_PATH = ""

# -----------------------------------------------------------------------------
# Training settings
# -----------------------------------------------------------------------------
_C.TRAIN = CN()
_C.TRAIN.START_EPOCH = 0
_C.TRAIN.EPOCHS = 300
_C.TRAIN.WARMUP_EPOCHS = 20
_C.TRAIN.WEIGHT_DECAY = 0.05
_C.TRAIN.BASE_LR = 5e-4
_C.TRAIN.WARMUP_LR = 5e-7
_C.TRAIN.MIN_LR = 5e-6
# Clip gradient norm
_C.TRAIN.CLIP_GRAD = 5.0
# Auto resume from latest checkpoint
_C.TRAIN.AUTO_RESUME = True
# Gradient accumulation steps
# could be overwritten by command line argument
_C.TRAIN.ACCUMULATION_STEPS = 1
# Whether to use gradient checkpointing to save memory
# could be overwritten by command line argument
_C.TRAIN.USE_CHECKPOINT = False

# LR scheduler
_C.TRAIN.LR_SCHEDULER = CN()
_C.TRAIN.LR_SCHEDULER.NAME = "cosine"
# Epoch interval to decay LR, used in StepLRScheduler
_C.TRAIN.LR_SCHEDULER.DECAY_EPOCHS = 30
# LR decay rate, used in StepLRScheduler
_C.TRAIN.LR_SCHEDULER.DECAY_RATE = 0.1

# Optimizer
_C.TRAIN.OPTIMIZER = CN()
_C.TRAIN.OPTIMIZER.NAME = "adamw"
# Optimizer Epsilon
_C.TRAIN.OPTIMIZER.EPS = 1e-8
# Optimizer Betas
_C.TRAIN.OPTIMIZER.BETAS = (0.9, 0.999)
# SGD momentum
_C.TRAIN.OPTIMIZER.MOMENTUM = 0.9

# -----------------------------------------------------------------------------
# Testing settings
# -----------------------------------------------------------------------------
_C.TEST = CN()
# Whether to use SequentialSampler as validation sampler
_C.TEST.SEQUENTIAL = False

# -----------------------------------------------------------------------------
# Misc
# -----------------------------------------------------------------------------
# Enable Pytorch automatic mixed precision (amp).
_C.AMP_ENABLE = True
# [Deprecated] Mixed precision opt level of apex, if O0, no apex amp is used ('O0', 'O1', 'O2')
_C.AMP_OPT_LEVEL = ""
# Path to output folder, overwritten by command line argument
_C.OUTPUT = ""
# Tag of experiment, overwritten by command line argument
_C.TAG = "default"
# Frequency to save checkpoint
_C.SAVE_FREQ = 1
# Disable saving feature to save disk space
_C.DISABLE_SAVE = False
# Frequency to logging info
_C.PRINT_FREQ = 10
# Fixed random seed
_C.SEED = 0
# Perform evaluation only, overwritten by command line argument
_C.EVAL_MODE = False
# Test throughput only, overwritten by command line argument
_C.THROUGHPUT_MODE = False
# Use torchinfo to show the flow
_C.DEBUG_MODE = False
# Repeat exps for publications
_C.EXP_INDEX = 0
# local rank for DistributedDataParallel, given by command line argument
_C.LOCAL_RANK = 0
# for acceleration
_C.FUSED_WINDOW_PROCESS = True


def _update_config_from_file(config, cfg_file):
    config.defrost()
    with open(cfg_file, "r") as f:
        yaml_cfg = yaml.load(f, Loader=yaml.FullLoader)

    for cfg in yaml_cfg.setdefault("BASE", [""]):
        if cfg:
            _update_config_from_file(
                config, os.path.join(os.path.dirname(cfg_file), cfg)
            )
    print("=> merge config from {}".format(cfg_file))
    config.merge_from_file(cfg_file)
    config.freeze()


def update_config(config, args, local_rank):
    _update_config_from_file(config, args.cfg)

    config.defrost()
    if args.opts:
        config.merge_from_list(args.opts)

    # merge from specific arguments
    if args.batch_size:
        config.DATA.BATCH_SIZE = args.batch_size
    if args.data_path:
        config.DATA.DATA_PATH = args.data_path
    if args.zip:
        config.DATA.ZIP_MODE = True
    if args.cache_mode:
        config.DATA.CACHE_MODE = args.cache_mode
    if args.pretrained:
        config.MODEL.PRETRAINED = args.pretrained
    if args.resume:
        config.MODEL.RESUME = args.resume
    if args.accumulation_steps:
        config.TRAIN.ACCUMULATION_STEPS = args.accumulation_steps
    if args.use_checkpoint:
        config.TRAIN.USE_CHECKPOINT = True
    if args.amp_opt_level:
        print("[warning] Apex amp has been deprecated, please use pytorch amp instead!")
        if args.amp_opt_level == "O0":
            config.AMP_ENABLE = False
    if args.disable_amp:
        config.AMP_ENABLE = False
    if args.output:
        config.OUTPUT = args.output
    if args.tag:
        config.TAG = args.tag
    if args.eval:
        config.EVAL_MODE = True
    if args.throughput:
        config.THROUGHPUT_MODE = True
    if args.debug:
        config.DEBUG_MODE = True

    # set local rank for distributed training
    config.LOCAL_RANK = local_rank

    # output folder
    config.OUTPUT = os.path.join(config.OUTPUT, config.MODEL.NAME, config.TAG)

    config.freeze()


def get_config(args, local_rank):
    """Get a yacs CfgNode object with default values."""
    # Return a clone so that the defaults will not be altered
    # This is for the "local variable" use pattern
    config = _C.clone()
    update_config(config, args, local_rank)

    return config
