import pickle
import time

import numpy as np
import torch
import tqdm

from pcdet.models import load_data_to_gpu
from pcdet.utils import common_utils
from pcdet.models.model_utils.dsnorm import set_ds_target

import statistics

def statistics_info(cfg, ret_dict, metric, disp_dict):
    for cur_thresh in cfg.MODEL.POST_PROCESSING.RECALL_THRESH_LIST:
        metric['recall_roi_%s' % str(cur_thresh)] += ret_dict.get('roi_%s' % str(cur_thresh), 0)
        metric['recall_rcnn_%s' % str(cur_thresh)] += ret_dict.get('rcnn_%s' % str(cur_thresh), 0)
    metric['gt_num'] += ret_dict.get('gt', 0)
    min_thresh = cfg.MODEL.POST_PROCESSING.RECALL_THRESH_LIST[0]
    disp_dict['recall_%s' % str(min_thresh)] = \
        '(%d, %d) / %d' % (metric['recall_roi_%s' % str(min_thresh)], metric['recall_rcnn_%s' % str(min_thresh)], metric['gt_num'])


def add_avg_performance(dataset, result_dict):

    dataset_name = dataset.dataset_cfg['DATASET']

    avg_types = ['3d', 'bev', 'image'] \
        if dataset_name == 'KittiDataset' else ['3d', 'bev', 'image']

    # avg_class_names = ['Car', 'Pedestrian', 'Cyclist']
    avg_class_names = dataset.class_names
    map_name_to_kitti = {
        'Vehicle': 'Car',
        'Pedestrian': 'Pedestrian',
        'Cyclist': 'Cyclist',
        'car': 'Car',
        'pedestrian': 'Pedestrian',
        'cyclist': 'Cyclist',
        'motorcycle': 'Cyclist',
        'Car': 'Car',
        'Pedestrian': 'Pedestrian',
        'car': 'Car',
        'pedestrian': 'Pedestrian',
        'motorcycle': 'Cyclist',
        'bicycle': 'Cyclist',
    }
    avg_class_names = [map_name_to_kitti[name] for name in avg_class_names]
    print('avg_class_names:', avg_class_names)

    difficulty_levels = ['easy', 'moderate', 'hard']

    print(dataset_name)
    if dataset.dataset_cfg.get('EVAL_METRIC', None):
        dataset_name = dataset.dataset_cfg['EVAL_METRIC']
    print(dataset_name)
    if dataset_name == 'KittiDataset' or dataset_name == 'NuScenesDataset' or dataset_name == 'KittiDatasetMT' or dataset_name == 'NuScenesDatasetMT':
        for type in avg_types:
            for difficulty in difficulty_levels:
                new_key = 'Average/{}_{}_R40'.format(type, difficulty)
                new_value = [selected_key for selected_key in
                             result_dict.keys() if
                             type in selected_key and difficulty in selected_key]
                new_value = [result_dict[i] for i in new_value]

                new_value = sum(new_value) / len(new_value) if len(
                    new_value) != 0 else 0
                result_dict[new_key] = new_value
                # Compute Harmonic_mean
                print(result_dict.keys())
                class_keys = ['{}_{}/{}_R40'.format(cls, type, difficulty) for cls in avg_class_names]
                print(class_keys)
                results_per_class = [result_dict[key] for key in class_keys]
                # print(results_per_class)
                new_key = 'Harmonic_mean/{}_{}_R40'.format(type, difficulty)
                new_value = statistics.harmonic_mean(results_per_class)
                # print(new_value)
                result_dict[new_key] = new_value

    elif dataset_name == 'WaymoDataset':
        avg_types = ['AP', 'APH']
        avg_class_names = dataset.class_names
        difficulty_levels = ['Level_1', 'Level_2']
        for type in avg_types:
            for difficulty in difficulty_levels:
                new_key = 'Average/{}_{}'.format(type,
                                                 difficulty)  # do not consider sign class
                new_value = [selected_key for selected_key in
                             result_dict.keys() if
                             type.lower() == selected_key.lower().split('/')[
                                 -1] and difficulty.lower() in selected_key.lower() and 'sign' not in selected_key.lower()]
                new_value = [result_dict[i] for i in new_value]
                new_value = sum(new_value) / len(new_value) if len(
                    new_value) != 0 else 0
                result_dict[new_key] = new_value

                new_key = 'Harmonic_mean/{}_{}_R40'.format(type, difficulty)
                new_value = statistics.harmonic_mean(new_value)
                result_dict[new_key] = new_value

    # TODO: NuScenes
    else:
        raise NotImplementedError
    return result_dict

def eval_one_epoch(cfg, model, dataloader, epoch_id, logger, dist_test=False, save_to_file=False, result_dir=None, args=None):
    result_dir.mkdir(parents=True, exist_ok=True)

    final_output_dir = result_dir / 'final_result' / 'data'
    if save_to_file:
        final_output_dir.mkdir(parents=True, exist_ok=True)

    metric = {
        'gt_num': 0,
    }
    for cur_thresh in cfg.MODEL.POST_PROCESSING.RECALL_THRESH_LIST:
        metric['recall_roi_%s' % str(cur_thresh)] = 0
        metric['recall_rcnn_%s' % str(cur_thresh)] = 0

    dataset = dataloader.dataset
    class_names = dataset.class_names
    det_annos = []

    logger.info('*************** EPOCH %s EVALUATION *****************' % epoch_id)
    if dist_test:
        num_gpus = torch.cuda.device_count()
        local_rank = cfg.LOCAL_RANK % num_gpus
        model = torch.nn.parallel.DistributedDataParallel(
                model,
                device_ids=[local_rank],
                broadcast_buffers=False
        )
    model.eval()

    if cfg.get('SELF_TRAIN', None) and cfg.SELF_TRAIN.get('DSNORM', None):
        model.apply(set_ds_target)

    if cfg.LOCAL_RANK == 0:
        progress_bar = tqdm.tqdm(total=len(dataloader), leave=True, desc='eval', dynamic_ncols=True)
    start_time = time.time()
    for i, batch_dict in enumerate(dataloader):
        load_data_to_gpu(batch_dict)
        with torch.no_grad():
            if cfg.MODEL.NAME.endswith('MT'):
                batch_dict = batch_dict[-1]
                pred_dicts, ret_dict = model(batch_dict, is_ema=True)
            elif cfg.get('SELF_TRAIN', None) and (cfg.SELF_TRAIN.get('MT', None) or ('MT' in cfg.DATA_CONFIG_TAR.DATASET)):
                batch_dict = batch_dict[-1]
                pred_dicts, ret_dict = model(batch_dict)
            else:
                pred_dicts, ret_dict = model(batch_dict)
        disp_dict = {}

        statistics_info(cfg, ret_dict, metric, disp_dict)
        annos = dataset.generate_prediction_dicts(
            batch_dict, pred_dicts, class_names,
            output_path=final_output_dir if save_to_file else None
        )
        det_annos += annos
        if cfg.LOCAL_RANK == 0:
            progress_bar.set_postfix(disp_dict)
            progress_bar.update()

    if cfg.LOCAL_RANK == 0:
        progress_bar.close()

    if dist_test:
        rank, world_size = common_utils.get_dist_info()
        det_annos = common_utils.merge_results_dist(det_annos, len(dataset), tmpdir=result_dir / 'tmpdir')
        metric = common_utils.merge_results_dist([metric], world_size, tmpdir=result_dir / 'tmpdir')

    logger.info('*************** Performance of EPOCH %s *****************' % epoch_id)
    sec_per_example = (time.time() - start_time) / len(dataloader.dataset)
    logger.info('Generate label finished(sec_per_example: %.4f second).' % sec_per_example)

    if cfg.LOCAL_RANK != 0:
        return {}

    ret_dict = {}
    if dist_test:
        for key, val in metric[0].items():
            for k in range(1, world_size):
                metric[0][key] += metric[k][key]
        metric = metric[0]

    gt_num_cnt = metric['gt_num']
    for cur_thresh in cfg.MODEL.POST_PROCESSING.RECALL_THRESH_LIST:
        cur_roi_recall = metric['recall_roi_%s' % str(cur_thresh)] / max(gt_num_cnt, 1)
        cur_rcnn_recall = metric['recall_rcnn_%s' % str(cur_thresh)] / max(gt_num_cnt, 1)
        logger.info('recall_roi_%s: %f' % (cur_thresh, cur_roi_recall))
        logger.info('recall_rcnn_%s: %f' % (cur_thresh, cur_rcnn_recall))
        ret_dict['recall/roi_%s' % str(cur_thresh)] = cur_roi_recall
        ret_dict['recall/rcnn_%s' % str(cur_thresh)] = cur_rcnn_recall

    total_pred_objects = 0
    for anno in det_annos:
        total_pred_objects += anno['name'].__len__()
    logger.info('Average predicted number of objects(%d samples): %.3f'
                % (len(det_annos), total_pred_objects / max(1, len(det_annos))))

    with open(result_dir / 'result.pkl', 'wb') as f:
        pickle.dump(det_annos, f)

    result_str, result_dict = dataset.evaluation(
        det_annos, class_names,
        eval_metric=cfg.MODEL.POST_PROCESSING.EVAL_METRIC,
        output_path=final_output_dir
    )
    result_dict = add_avg_performance(dataset, result_dict)

    logger.info(result_str)
    ret_dict.update(result_dict)

    # add avg predicted number of objects to tensorboard log
    ret_dict['eval_avg_pred_bboxes'] = total_pred_objects / max(1, len(det_annos))

    logger.info('Result is save to %s' % result_dir)
    logger.info('****************Evaluation done.*****************')
    return ret_dict


if __name__ == '__main__':
    pass
