import os
from data_provider.data_loader import Dataset_ETT_hour, Dataset_Custom, Dataset_ETT_minute
from torch.utils.data import DataLoader
from torch.utils.data.distributed import DistributedSampler

from data_provider.data_loader_benchmark import CIAutoRegressionDatasetBenchmark

data_dict = {
    'ETTh1': Dataset_ETT_hour,
    'ETTh2': Dataset_ETT_hour,
    'ETTm1': Dataset_ETT_minute,
    'ETTm2': Dataset_ETT_minute,
    'custom': Dataset_Custom,
}


def data_provider(args, flag):
    Data = data_dict[args.data]
    timeenc = 0 if args.embed != 'timeF' else 1
    freq = args.freq

    shuffle_flag = False
    drop_last = args.drop_last
    batch_size = args.batch_size 

    if not args.nonautoregressive:
        data_set = CIAutoRegressionDatasetBenchmark(
            root_path=os.path.join(args.root_path, args.data_path),
            flag=flag,
            input_len=args.seq_len,
            label_len=args.label_len,
            pred_len=args.output_len if flag == 'test' else args.pred_len,
            data_type=args.data,
            scale=True,
            timeenc=timeenc,
            freq=freq,
            stride=args.stride,
            subset_rand_ratio=args.subset_rand_ratio,
        )
    else:
        data_set = Data(
            args = args,
            root_path=args.root_path,
            data_path=args.data_path,
            flag=flag,
            size=[args.seq_len, args.label_len, args.output_len],
            features=args.features,
            seasonal_patterns=args.seasonal_patterns,
            drop_short=args.drop_short,
            freq=freq,
        )
    if (args.use_multi_gpu and args.local_rank == 0) or not args.use_multi_gpu:
        print(flag, len(data_set))
    if args.use_multi_gpu:
        train_datasampler = DistributedSampler(data_set, shuffle=shuffle_flag)
        data_loader = DataLoader(data_set, 
            batch_size=batch_size,
            sampler=train_datasampler,
            num_workers=args.num_workers,
            persistent_workers=True,
            pin_memory=True,
            )
    else:
        data_loader = DataLoader(
            data_set,
            batch_size=batch_size,
            shuffle=shuffle_flag,
            num_workers=args.num_workers,
            drop_last=drop_last)
    return data_set, data_loader