from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import os.path as osp
import numpy as np
import pickle
import collections

from dataset.joints_dataset_3dhp import JointsDataset3dhp
import multiviews.cameras as cam_utils

class MultiView3dhp2d(JointsDataset3dhp):
    def __init__(self, cfg, image_set, is_train, transform=None):
        super().__init__(cfg, image_set, is_train, transform)
        self.actual_joints = {
            0: 'pelvis',
            1: 'head_top',
            2: 'neck',
            3: 'right_shoulder',
            4: 'right_elbow',
            5: 'right_wrist',
            6: 'left_shoulder',
            7: 'left_elbow',
            8: 'left_wrist',
            9: 'right_hip',
            10: 'right_knee',
            11: 'right_ankle',
            12: 'left_hip',
            13: 'left_knee',
            14: 'left_ankle',
            15: 'spine',
            16: 'head',
        }

        self.u2a_mapping = super().get_mapping()

        grouping_db_pickle_file = osp.join(self.root, 'mpi-inf-3dhp', 'quickload',
                                           '3dhp_quickload_{}.pkl'
                                           .format(image_set))
        if osp.isfile(grouping_db_pickle_file):
            with open(grouping_db_pickle_file, 'rb') as f:
                grouping_db = pickle.load(f)
                self.grouping = grouping_db['grouping']
                self.db = grouping_db['db']
                #self.grouping16 = grouping_db['grouping16']
        else:
            anno_file = osp.join(self.root, 'mpi-inf-3dhp', 'annot',
                                 '3dhp_{}.pkl'.format(image_set))
            self.db = self.load_db(anno_file)

            self.u2a_mapping = super().get_mapping()
            super().do_mapping()

            self.grouping = self.get_group(self.db)
            #self.grouping16 = self.get_group16(self.db)
            #grouping_db_to_dump = {'grouping': self.grouping, 'db': self.db, 'grouping16': self.grouping16}
            #with open(grouping_db_pickle_file, 'wb') as f:
            #    pickle.dump(grouping_db_to_dump, f)

        if self.is_train:
            self.grouping = self.grouping[::6]
            #self.grouping16 = self.grouping16[::20]
        else:
            self.grouping = self.grouping[::5]
            #self.grouping16 = self.grouping16[::]

        self.group_size = len(self.grouping)
        self.selected_cam = [0,1,2,3]

    def index_to_action_names(self):
        return {
            1: 'Walking/Standing',
            2: 'Exercise',
            3: 'Sitting(1)',
            4: 'Crouch/Reach',
            5: 'On the Floor',
            6: 'Sports',
            7: 'Sitting(2)',
            8: 'Miscellaneous',
        }
    
    def load_db(self, dataset_file):
        with open(dataset_file, 'rb') as f:
            dataset = pickle.load(f)
            return dataset

    def get_group(self, db):
        grouping = {}
        nitems = len(db)
        mpp={}
        mpp[0] = 0
        mpp[2] = 1
        mpp[7] = 2
        mpp[8] = 3
        for i in range(nitems):
            keystr ='s_{:01}_seq_{:01}_imgid_{:06}'.format(db[i]['action'], db[i]['seq'],db[i]['image_id'])
            #print(keystr)
            if not osp.exists(self.root+'mpi-inf-3dhp/images/'+ 's_{:01}_seq_{:01}_ca_{:01}'.format(db[i]['action'], db[i]['seq'],db[i]['camera_id'])):
                continue

            camera_id = mpp[db[i]['camera_id']]
            if keystr not in grouping:
                grouping[keystr] = [-1, -1, -1, -1]
            grouping[keystr][camera_id] = i

        filtered_grouping = []
        for _, v in grouping.items():
            if np.all(np.array(v) != -1):
                filtered_grouping.append(v)

        return filtered_grouping
    
    def get_group16(self, db):
        grouping16 = {}
        nitems = len(db)
        mpp={}
        mpp[0] = 0
        mpp[2] = 1
        mpp[7] = 2
        mpp[8] = 3
        for i in range(nitems):
            keystr ='s_{:01}_seq_{:01}_imgid_{:06}'.format(db[i]['action'], db[i]['seq'],((db[i]['image_id']-1) // 4 * 4 + 1))

            if not osp.exists(self.root+'mpi-inf-3dhp/images/'+ 's_{:01}_seq_{:01}_ca_{:01}'.format(db[i]['action'], db[i]['seq'],db[i]['camera_id'])):
                continue
            
            camera_id = mpp[db[i]['camera_id']]
            if keystr not in grouping16:
                grouping16[keystr] = [-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1]
            grouping16[keystr][camera_id*4+(db[i]['image_id']-1)%4] = i

        filtered_grouping = []
        for _, v in grouping16.items():
            if np.all(np.array(v) != -1):
                filtered_grouping.append(v)

        return filtered_grouping
    
    def __getitem__(self, idx):
        input, target, weight, meta,target16 = [], [], [], [],[]
        items = self.grouping[idx]
        #items16 = self.grouping16[idx]
        for item in items:
            i, t, w, m = super().__getitem__(item)
            m['scale'] = m['scale'].astype(np.float32)
            m['center'] = m['center'].astype(np.float32)
            m['rotation'] = int(m['rotation'])
            if 'name' in m['camera']:
                del m['camera']['name']
            for k in m['camera']:
                m['camera'][k] = m['camera'][k].astype(np.float32)

            input.append(i)
            target.append(t)
            weight.append(w)
            meta.append(m)
        """
        for item16 in items16:
            i_, t16_, w_, m_ = super().__getitem__(item16)
            target16.append(t16_)
        """
        return input, target, weight, meta
    
    def __len__(self):
        return self.group_size

    def get_key_str(self, datum):
        return 's_{:01}_seq_{:01}_imgid_{:06}'.format(
            datum['action'], datum['seq'],
            datum['image_id'])
    
    def evaluate(self, pred, *args, **kwargs):
        pred = pred.copy()
        nview = 4
        if 'threshold' in kwargs:
            threshold = kwargs['threshold']
        else:
            threshold = 0.0125
        u2a = self.u2a_mapping
        a2u = {v: k for k, v in u2a.items() if v != '*'}
        a = list(a2u.keys())
        u = list(a2u.values())
        indexes = list(range(len(a)))
        indexes.sort(key=a.__getitem__)
        sa = list(map(a.__getitem__, indexes))
        su = np.array(list(map(u.__getitem__, indexes)))

        gt = []
        flat_items = []
        box_lengthes = []
        cnt = 0
        for items in self.grouping:
            for item in items:
                gt.append(self.db[item]['joints_2d'][su, :2])
                #print(type(keypoints['positions_2d'][1]))
                #print(keypoints['S2'])
                #keypoints['S'+str(self.db[item]['action'])]['seq'+str(self.db[item]['seq'])][mpp[self.db[item]['camera_id']]][self.db[item]['image_id']-1][:,0:2] = pred[cnt][:,0:2]
                flat_items.append(self.db[item])
                boxsize = np.array(self.db[item]['scale']).sum() * 100.0  # crop img pixels
                box_lengthes.append(boxsize)
                cnt = cnt + 1
        
        gt = np.array(gt)
        if pred.shape[1] == 20:
            pred = pred[:, su, :2]
        elif pred.shape[1] == 17:
            pred = pred[:, :, :2]
        detection_threshold = np.array(box_lengthes).reshape((-1, 1)) * threshold

        distance = np.sqrt(np.sum((gt - pred)**2, axis=2))
        detected = (distance <= detection_threshold)

        joint_detection_rate = np.sum(detected, axis=0) / np.float(gt.shape[0])

        name_values = collections.OrderedDict()
        joint_names = self.actual_joints
        for i in range(len(a2u)):
            name_values[joint_names[sa[i]]] = joint_detection_rate[i]
        detected_int = detected.astype(np.int)
        nsamples, njoints = detected.shape
        per_grouping_detected = detected_int.reshape(nsamples // nview, nview * njoints)
        return name_values, np.mean(joint_detection_rate), per_grouping_detected

    def evaluate_3d(self, preds3d, thresholds=None):
        if thresholds is None:
            thresholds = [5., 10., 15., 20., 25., 50., 75., 100., 125., 150.,]

        gt3d = []
        for idx, items in enumerate(self.grouping):
            # note that h36m joints_3d is in camera frame
            db_rec = self.db[items[0]]
            j3d_global = cam_utils.camera_to_world_frame(db_rec['joints_3d'], db_rec['camera']['R'], db_rec['camera']['T'])
            gt3d.append(j3d_global)
        gt3d = np.array(gt3d)

        assert preds3d.shape == gt3d.shape, 'shape mismatch of preds and gt'
        distance = np.sum((preds3d - gt3d)**2, axis=2)

        num_groupings = len(gt3d)
        pcks = []
        for thr in thresholds:
            detections = distance <= thr**2
            detections_perjoint = np.sum(detections, axis=0)
            pck_perjoint = detections_perjoint / num_groupings
            # pck_avg = np.average(pck_perjoint, axis=0)
            pcks.append(pck_perjoint)

        return thresholds, pcks