import json
import os
import numpy as np
import sys
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))

from utils import empty_instance_dict, load_calibration, load_novatel_data, convert_novatel_to_pose

vehicle_labels = ['Car', 'Truck', 'Bus']

dataset_root = '/path/to/cadcd'
out_dir = '/your/out/dir'
os.makedirs(out_dir, exist_ok=True)

for date in os.listdir(dataset_root):
    # Load calibration matrices
    # (N.B. in CADC notation, T_A_B is the transformation from B to A, in our notation it's from A to B)
    extrinsics = load_calibration(os.path.join(dataset_root, date, 'calib'))['extrinsics']
    T_IMU_LIDAR = np.array(extrinsics['T_LIDAR_GPSIMU'])

    for scene_id in os.listdir(os.path.join(dataset_root, date)):
        if scene_id == 'calib':
            continue
        
        # Load scene annotations
        with open(os.path.join(dataset_root, date, scene_id, '3d_ann.json')) as json_file:
            scene_data = json.load(json_file)

        # Load inertial measurements of all frames in the scene
        novatel = load_novatel_data(os.path.join(dataset_root, date, scene_id, 'labeled/novatel/data/'))
        T_IMU_ENU_list = convert_novatel_to_pose(novatel)
        T_IMU0_ENU = T_IMU_ENU_list[0]
        yaw_0 = np.deg2rad(-1.0 * float(novatel[0][9]))

        scene_dict = {}
        # Iterate over frames in the scene
        for frame_num, frame_ann in enumerate(scene_data):

            # Compute transformation matrix from LiDAR_t to LiDAR_0
            T_IMUt_ENU = T_IMU_ENU_list[frame_num]
            T_LIDARt_LIDAR0 = T_IMU_LIDAR @ np.linalg.inv(T_IMU0_ENU) @ T_IMUt_ENU @ np.linalg.inv(T_IMU_LIDAR)

            # Iterate over instances in the frame
            for ann in frame_ann['cuboids']:
                # Skip if instance is not a vehicle
                if ann['label'] not in vehicle_labels:
                    continue
                                
                if ann['uuid'] not in scene_dict:
                    scene_dict[ann['uuid']] = empty_instance_dict()
                
                # Transform centroids from LiDAR_t to LiDAR_0
                translation = T_LIDARt_LIDAR0 @ np.array([ann['position']['x'], ann['position']['y'], ann['position']['z'], 1])
                translation = translation.tolist()[0][:3]

                # Compute yaw rotation from LiDAR_t to LiDAR_0
                yaw_t = np.deg2rad(-1.0 * float(novatel[frame_num][9]))
                d_rotation = yaw_t - yaw_0
                rotation_yaw = ann['yaw'] + d_rotation
                rotation = [0., 0., rotation_yaw]

                # Read size (order should be heigth, width, length)
                size = [ann['dimensions']['z'], ann['dimensions']['x'], ann['dimensions']['y']]
                
                scene_dict[ann['uuid']]['timestep'].append(frame_num)
                scene_dict[ann['uuid']]['translation'].append(translation)
                scene_dict[ann['uuid']]['rotation'].append(rotation)
                scene_dict[ann['uuid']]['size'].append(size)
                scene_dict[ann['uuid']]['attribute_label'].append(ann['label'])

        # Save scene dict
        with open(os.path.join(out_dir, f'{date}_{scene_id}.json'), 'w') as json_file:
            json.dump(scene_dict, json_file, indent=4)
        
