from data_provider.data_loader import Dataset_ETT_hour, Dataset_ETT_minute, Dataset_Custom, Dataset_M4, PSMSegLoader, \
    MSLSegLoader, SMAPSegLoader, SMDSegLoader, SWATSegLoader, UEAloader, Monashloader, Noisy_UEAloader
from data_provider.uea import collate_fn
from torch.utils.data import DataLoader

data_dict = {
    # 'ETTh1': Dataset_ETT_hour,
    # 'ETTh2': Dataset_ETT_hour,
    # 'ETTm1': Dataset_ETT_minute,
    # 'ETTm2': Dataset_ETT_minute,
    # 'custom': Dataset_Custom,
    # 'm4': Dataset_M4,
    # 'PSM': PSMSegLoader,
    # 'MSL': MSLSegLoader,
    # 'SMAP': SMAPSegLoader,
    # 'SMD': SMDSegLoader,
    # 'SWAT': SWATSegLoader,
    'UEA': UEAloader,
    'Noisy_UEA': Noisy_UEAloader,
    # 'Monash': Monashloader
}


def data_provider(args, flag, bin_edges=None):
    Data = data_dict[args.data]
    timeenc = 0 if args.embed != 'timeF' else 1
    # flag = flag.lower()

    if flag == 'test' or flag == 'TEST':
        print("Testing mode: setting shuffle=False", 1, args.freq)
        shuffle_flag = False
        drop_last = True
        if args.task_name == 'anomaly_detection' or args.task_name == 'classification':
            batch_size = args.batch_size
        else:
            batch_size = 1  # bsz=1 for evaluation
        freq = args.freq
    else:
        print("Training mode: setting shuffle=True", args.batch_size, args.freq)
        shuffle_flag = True
        drop_last = True
        batch_size = args.batch_size  # bsz for train and valid
        freq = args.freq
    if args.task_name == 'explanation':
        print("Explanation generation mode: setting batch_size=1, shuffle=False")
        shuffle_flag = False # No shuffling for explanation generation, Very important! Since we use order in the save file to evaluate !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! ******************** !!!!!!!!!!!!!!!!!!!!
        drop_last = False
        batch_size = args.batch_size  # bsz for train and valid
        freq = args.freq
    # print(flag, flag== 'test', batch_size, freq)
    # exit()


    if args.task_name == 'anomaly_detection':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            win_size=args.seq_len,
            flag=flag,
        )
        print(flag, len(data_set))
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last)
        return data_set, data_loader
    elif args.task_name == 'classification' or args.task_name == 'explanation':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            flag=flag,
        )

        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last,
            collate_fn=lambda x: collate_fn(x, max_len=args.seq_len)
        )
        return data_set, data_loader
    elif args.task_name == 'regression':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            flag=flag,
            bin_edges=bin_edges
        )
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last,
            collate_fn=lambda x: collate_fn(x, max_len=args.seq_len)
        )
        return data_set, data_loader
    else:
        if args.data == 'm4':
            drop_last = False
        data_set = Data(
            root_path=args.root_path,
            data_path=args.data_path,
            flag=flag,
            size=[args.seq_len, args.label_len, args.pred_len],
            features=args.features,
            target=args.target,
            timeenc=timeenc,
            freq=freq,
            seasonal_patterns=args.seasonal_patterns
        )
        print(flag, len(data_set))
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last)
        return data_set, data_loader


def noisy_data_provider(args, flag, bin_edges=None):
    Data = data_dict['Noisy_UEA']
    timeenc = 0 if args.embed != 'timeF' else 1
    # flag = flag.lower()

    if flag == 'test' or flag == 'TEST':
        print("Testing mode: setting shuffle=False", 1, args.freq)
        shuffle_flag = False
        drop_last = True
        if args.task_name == 'anomaly_detection' or args.task_name == 'classification':
            batch_size = args.batch_size
        else:
            batch_size = 1  # bsz=1 for evaluation
        freq = args.freq
    else:
        print("Training mode: setting shuffle=True", args.batch_size, args.freq)
        shuffle_flag = True
        drop_last = True
        batch_size = args.batch_size  # bsz for train and valid
        freq = args.freq
    if args.task_name == 'explanation':
        print("Explanation generation mode: setting batch_size=1, shuffle=False")
        shuffle_flag = False # No shuffling for explanation generation, Very important! Since we use order in the save file to evaluate !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! ******************** !!!!!!!!!!!!!!!!!!!!
        drop_last = False
        batch_size = args.batch_size  # bsz for train and valid
        freq = args.freq
    # print(flag, flag== 'test', batch_size, freq)
    # exit()


    if args.task_name == 'anomaly_detection':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            win_size=args.seq_len,
            flag=flag,
        )
        print(flag, len(data_set))
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last)
        return data_set, data_loader
    elif args.task_name == 'classification' or args.task_name == 'explanation':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            flag=flag,
        )

        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last,
            collate_fn=lambda x: collate_fn(x, max_len=args.seq_len)
        )
        return data_set, data_loader
    elif args.task_name == 'regression':
        drop_last = False
        data_set = Data(
            root_path=args.root_path,
            flag=flag,
            bin_edges=bin_edges
        )
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last,
            collate_fn=lambda x: collate_fn(x, max_len=args.seq_len)
        )
        return data_set, data_loader
    else:
        if args.data == 'm4':
            drop_last = False
        data_set = Data(
            root_path=args.root_path,
            data_path=args.data_path,
            flag=flag,
            size=[args.seq_len, args.label_len, args.pred_len],
            features=args.features,
            target=args.target,
            timeenc=timeenc,
            freq=freq,
            seasonal_patterns=args.seasonal_patterns
        )
        print(flag, len(data_set))
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last)
        return data_set, data_loader

