from omni.isaac.kit import SimulationApp
simulation_app = SimulationApp({
    "headless": True,
    "renderer": "RayTracedLighting",
    "carb_settings": {
        "persistentKernelCache": False 
    }
})
import datetime
from omni.isaac.core.utils.stage import open_stage
from omni.isaac.core import World
import omni.isaac.core.utils.numpy.rotations as rot_utils
from omni.isaac.sensor import Camera
import numpy as np
import omni.usd
from pxr import UsdLux, Gf
from PIL import Image
import os
import json
import time
import argparse
from pathlib import Path
import collections 
import gc
from scipy.spatial.transform import Rotation as R


# def world_to_sensor_camera_quat(q_world):
#     # q_world: [x, y, z, w]，即(omni采集出来的四元数)
#     # 需要和补偿四元数合成
#
#     r_correction = R.from_euler('zy', [90, 90], degrees=True)
#     r_world = R.from_quat(q_world)  # 注意用[x, y, z, w]
#     r_sensor = r_correction * r_world
#     return r_sensor.as_quat()  # [x, y, z, w]


# def world_to_sensor_camera_quat(q_world):
#     # q_world: [x, y, z, w]，即(omni采集出来的四元数)
#     # 需要和补偿四元数合成
#
#     r_correction = R.from_euler('zxy', [-90, 90, -90], degrees=True)
#     r_world = R.from_quat(q_world)  # 注意用[x, y, z, w]
#     r_sensor = r_correction * r_world
#     return r_sensor.as_quat()  # [x, y, z, w]


# def world_to_sensor_camera_quat(q_world):
#     # q_world: [x, y, z, w]，即(omni采集出来的四元数)
#     # 需要和补偿四元数合成
#
#     r_correction = R.from_euler('xy', [90, -90], degrees=True)
#     r_world = R.from_quat(q_world)  # 注意用[x, y, z, w]
#     r_sensor = r_correction * r_world
#     return r_sensor.as_quat()  # [x, y, z, w]

# def world_to_sensor_camera_quat(q_world):
#     # q_world: [x, y, z, w]，即(omni采集出来的四元数)
#     # 需要和补偿四元数合成
#
#     r_correction = R.from_euler('xz', [90, -90], degrees=True)
#     r_world = R.from_quat(q_world)  # 注意用[x, y, z, w]
#     r_sensor = r_correction * r_world
#     return r_sensor.as_quat()  # [x, y, z, w]


# 先把旧的分量重排转成矩阵
# def quat_reorder_old(q):
#     return np.array([q[1], q[3], -q[0], -q[2]])


# def usd_to_isaac_quat(q_usd):
#     """
#     把 USD Camera 系 (-Z前, +Y上) 的 quat 转换成 Isaac Camera 系 (+Z前, +Y上)
#     q_usd: [x, y, z, w]
#     """
#     R_fix = R.from_euler('x', 180, degrees=True)  # USD->Isaac 基系旋转
#     return (R_fix * R.from_quat(q_usd)).as_quat()


class CameraBatchProcessor:
    def __init__(self, config_file, base_usd_path, output_base_path, max_concurrent_cameras=200, start_index=0):
        self.config_file = config_file
        self.base_usd_path = Path(base_usd_path)
        self.output_base_path = Path(output_base_path)
        self.max_concurrent_cameras = max_concurrent_cameras
        self.start_index = start_index
        
        with open(config_file, 'r') as f:
            self.config = json.load(f)
        
        self.scenes = [
            scene for scene in self.config.get('scenes', []) 
            if scene.get('scene_id') is not None and scene.get('scene_id') >= self.start_index
        ]
        
        self.output_base_path.mkdir(parents=True, exist_ok=True)
        
        print(f"找到 {len(self.scenes)} 个待处理场景 (起始ID >= {self.start_index})")



    # def create_camera(self, prim_path, point_info):
    #     position = np.array(point_info['position'])
    #     q_world_usd = np.array(point_info['rotation'])
    #
    #     I = np.array([0, 0, 0, 1])
    #     R_map_old = R.from_quat(quat_reorder_old(I))
    #
    #     # 叠加 X=-90° 的场景全局旋转
    #     R_xneg90 = R.from_euler('zx', [-90, 90], degrees=True)
    #     R_map_new = R_xneg90 * R_map_old
    #
    #     # 新映射一次性包含旧公式和X=-90°
    #     orientation = (R_map_new * R.from_quat(q_world_usd)).as_quat()
    #
    #     np.set_printoptions(precision=20, suppress=True)
    #     print('[{}]'.format(', '.join(f'{x:.20f}' for x in orientation)))
    #
    #     camera = Camera(
    #         prim_path=prim_path,
    #         position=position,
    #         frequency=3,
    #         resolution=(640, 480),
    #         orientation=orientation,
    #     )
    #     camera.initialize()
    #     camera.add_motion_vectors_to_frame()
    #     camera.set_horizontal_aperture(7)
    #     camera.set_vertical_aperture(5)
    #     return camera

    # def create_camera(self, prim_path, point_info):
    #     """创建单个摄像头，并应用位姿"""
    #     position = np.array(point_info['position'])
    #     # position[2] += 1.0
    #
    #     orientation = np.array(point_info['rotation'])
    #     # orientation = world_to_sensor_camera_quat(np.array(point_info['rotation']))
    #     # print(orientation)
    #
    #     np.set_printoptions(precision=20, suppress=True)
    #     result = '[{}]'.format(', '.join(f'{x:.20f}' for x in orientation))
    #     print(result)
    #
    #     camera = Camera(
    #         prim_path=prim_path,
    #         position=position,
    #         frequency=3,
    #         resolution=(640, 480),
    #         orientation=orientation,
    #     )
    #     camera.initialize()
    #     camera.add_motion_vectors_to_frame()
    #     camera.set_horizontal_aperture(7)
    #     camera.set_vertical_aperture(5)
    #     return camera

    def create_camera(self, prim_path, point_info):
        position = np.array(point_info['position'])
        orientation = np.array(point_info['rotation'])  # 直接用，完全不补偿

        camera = Camera(
            prim_path=prim_path,
            position=position,
            frequency=3,
            resolution=(640, 480),
            orientation=orientation
        )
        camera.initialize()
        return camera

    # 839920.usdz
    # def create_camera(self, prim_path, point_info):
    #     """创建单个摄像头，并应用位姿"""
    #     position = np.array(point_info['position'])
    #     # position[2] += 1.0
    #
    #     orientation = np.array(point_info['rotation'])
    #     # orientation = world_to_sensor_camera_quat(np.array(point_info['rotation']))
    #     # print(orientation)
    #
    #     q = orientation
    #     orientation = np.array([q[1], q[3], q[0], -q[2]])
    #     # orientation = world_to_sensor_camera_quat(orientation)
    #
    #     np.set_printoptions(precision=20, suppress=True)
    #     result = '[{}]'.format(', '.join(f'{x:.20f}' for x in orientation))
    #     print(result)
    #
    #
    #     camera = Camera(
    #         prim_path=prim_path,
    #         position=position,
    #         frequency=3,
    #         resolution=(640, 480),
    #         orientation=orientation,
    #     )
    #     camera.initialize()
    #     camera.add_motion_vectors_to_frame()
    #     camera.set_horizontal_aperture(7)
    #     camera.set_vertical_aperture(5)
    #     return camera


    def _setup_new_world(self, scene_path):
        """加载或重新加载场景，并设置好环境"""
        omni.usd.get_context().close_stage()
        gc.collect()
        
        if not open_stage(usd_path=str(scene_path)):
            print(f"错误：无法打开场景文件 {scene_path}")
            return None, None

        stage = omni.usd.get_context().get_stage()
        
        if not stage.GetPrimAtPath("/World/EnvLight"):
            dome = UsdLux.DomeLight.Define(stage, "/World/EnvLight")
            dome.CreateIntensityAttr(30000.0)
            dome.CreateColorAttr(Gf.Vec3f(1.0, 1.0, 1.0))
        
        world = World()
        world.reset()
        
        for _ in range(10): 
            world.step(render=True)
            
        return world, stage

    def process_scene(self, scene_info):
        """
        处理一个场景的所有拍照点。
        修改后的逻辑：只加载一次场景，创建一批摄像头，然后通过调整位置和朝向来拍摄所有照片。
        """
        scene_id = scene_info['scene_id']
        scene_name = scene_info['scene_name']
        
        print(f"\n开始处理场景: {scene_name} (ID: {scene_id})")

        scene_path = self.base_usd_path
        # scene_path = self.base_usd_path / scene_name / f"{scene_name}.usd"
        if not scene_path.exists():
            print(f"警告: 场景文件不存在 {str(scene_path)}，跳过此场景。")
            return None
    
        # 1. 只加载一次场景
        world, stage = self._setup_new_world(scene_path)
        if world is None:
            print(f"错误：无法加载场景 {scene_name}")
            return None
    
        all_points_in_scene = []
        for sample in scene_info['samples']:
            trajectory_id = sample['trajectory_id']
            for point_data in sample['points']:
                point_data_with_context = point_data.copy()
                point_data_with_context['trajectory_id'] = trajectory_id
                all_points_in_scene.append(point_data_with_context)
    
        total_points = len(all_points_in_scene)
        num_batches = (total_points + self.max_concurrent_cameras - 1) // self.max_concurrent_cameras
        print(f"场景 {scene_name} 共有 {total_points} 个拍照点, 将使用 {min(self.max_concurrent_cameras, total_points)} 个摄像头分 {num_batches} 批拍摄")
    
        num_cameras = min(self.max_concurrent_cameras, total_points)
        cameras = []
        for i in range(num_cameras):
            prim_path = f"/World/camera_{i}"
            initial_point = all_points_in_scene[i] if i < len(all_points_in_scene) else all_points_in_scene[0]
            camera = self.create_camera(prim_path, initial_point)
            cameras.append(camera)
            print(f"    创建摄像头 {prim_path}")
        
        for _ in range(10):
            world.step(render=True)
    
        all_results = []
        
        for batch_idx in range(num_batches):
            start_time = time.time()
            chunk_start = batch_idx * self.max_concurrent_cameras
            chunk_end = min(chunk_start + self.max_concurrent_cameras, total_points)
            point_chunk = all_points_in_scene[chunk_start:chunk_end]
            
            print(f"  处理批次 {batch_idx + 1}/{num_batches} (点 {chunk_start+1} 到 {chunk_end})...")

            if batch_idx == 0:
                print("  注意：这是第一次处理批次，摄像头位置和方向将基于初始点进行设置。")
            else :
                for i, point_info in enumerate(point_chunk):
                    if i < len(cameras):  
                        camera = cameras[i]
                        position = np.array(point_info['position'])
                        position[2] += 1.0  #调高相机高度防止贴地
                        orientation = np.array(point_info['rotation'])
                        
                        
                        camera.set_world_pose(position=position, orientation=orientation)
                        print(f"    调整摄像头 {i} 到位置: {point_info['position']}, 方向: {point_info['rotation']}")
    
            for _ in range(10):
                world.step(render=True)
    
            for i, point_info in enumerate(point_chunk):
                if i < len(cameras):
                    camera = cameras[i]
                    rgb_img = camera.get_rgba()[:, :, :3]
                    
                    scene_id = scene_info['scene_id']
                    scene_name = scene_info['scene_name']
                    trajectory_id = point_info['trajectory_id']
                    point_id = point_info['point']
                    
                    image_id = f"scene_{scene_id}_traj_{trajectory_id}_point_{point_id}"
                    
                    trajectory_output_dir = self.output_base_path / f"{scene_name}" / f"trajectory_{trajectory_id}"
                    trajectory_output_dir.mkdir(parents=True, exist_ok=True)
                    
                    output_path = trajectory_output_dir / f"{image_id}.png"
                    Image.fromarray(rgb_img).save(str(output_path))
                    
                    all_results.append({
                        'trajectory_id': trajectory_id,
                        'point_id': point_id,
                        'image_id': image_id,
                        'image_path': f"trajectory_{trajectory_id}/{image_id}.png",
                        'position': point_info['position'],
                        'rotation': point_info['rotation'],
                    })
            
            end_time = time.time()
            print(f"  批次 {batch_idx + 1} 处理完成，耗时 {end_time - start_time:.2f} 秒。")

        updated_scene_data = self.aggregate_and_save_results(scene_info, all_results)
    
        print(f"场景 {scene_name} 处理完成，共拍摄 {len(all_results)} 张照片。")
        return updated_scene_data

    def aggregate_and_save_results(self, scene_info, all_results):
        """将扁平化的结果重新按轨迹组织，保存文件，并返回最终的场景数据结构"""
        scene_id = scene_info['scene_id']
        scene_name = scene_info['scene_name']
        
        results_by_traj = collections.defaultdict(list)
        for res in all_results:
            results_by_traj[res['trajectory_id']].append(res)
            
        original_points_map = {}
        for sample in scene_info['samples']:
            traj_id = sample['trajectory_id']
            for p in sample['points']:
                p['camera_images'] = []
            original_points_map[traj_id] = {p['point']: p for p in sample['points']}

        for trajectory_id, results in results_by_traj.items():
            for result in results:
                point_id = result['point_id']
                original_points_map[trajectory_id][point_id]['camera_images'].append({
                    'image_id': result['image_id'],
                    'image_path': result['image_path'],
                })

            updated_points = list(original_points_map[trajectory_id].values())
            
            trajectory_info = {
                'trajectory_id': trajectory_id,
                'points': updated_points
            }
            for i, sample in enumerate(scene_info['samples']):
                if sample['trajectory_id'] == trajectory_id:
                    scene_info['samples'][i] = trajectory_info
                    break

            scene_output_dir = self.output_base_path / f"{scene_name}"
            trajectory_output_dir = scene_output_dir / f"trajectory_{trajectory_id}"
            if not trajectory_output_dir.exists():
                raise FileNotFoundError(f"输出目录 {trajectory_output_dir} 不存在。")

            trajectory_info_path = trajectory_output_dir / 'trajectory_info.json'
            with open(trajectory_info_path, 'w') as f:
                json.dump(trajectory_info, f, indent=2)

        scene_info_result = {
            'scene_id': scene_id,
            'scene_name': scene_name,
            'samples': scene_info['samples'] 
        }
        scene_info_path = scene_output_dir / 'scene_info.json'
        with open(scene_info_path, 'w') as f:
            json.dump(scene_info_result, f, indent=2)

        return scene_info_result 

    def save_updated_config(self):
        """将内存中完全更新后的 self.config 对象保存到新文件"""
        updated_config_path = self.output_base_path / 'config_with_images.json'
        print(f"\n正在保存包含所有图片信息的最终配置文件到: {updated_config_path}")
        with open(updated_config_path, 'w') as f:
            json.dump(self.config, f, indent=2)
        print("最终配置文件保存成功。")

    def process_all_scenes(self, target_scene_ids=None):
        """处理所有场景，并在结束后保存一个更新过的配置文件"""
        scenes_to_process = [
            s for s in self.scenes if not target_scene_ids or s['scene_id'] in target_scene_ids
        ]
        
        total_scenes = len(scenes_to_process)
        successful_scenes = 0
        
        for i, scene_info in enumerate(scenes_to_process):
            print(f"\n{'='*60}")
            print(f"处理总进度: {i+1}/{total_scenes} - Scene ID: {scene_info['scene_id']}")
            print(f"{'='*60}")

            updated_scene_data = self.process_scene(scene_info)
            
            if updated_scene_data:
                successful_scenes += 1
                for idx, original_scene in enumerate(self.config['scenes']):
                    if original_scene['scene_id'] == updated_scene_data['scene_id']:
                        self.config['scenes'][idx] = updated_scene_data
                        print(f"场景 {scene_info['scene_id']} 的数据已更新到主配置中。")
                        break
            
            gc.collect()
        
        print(f"\n处理完成! 成功处理 {successful_scenes}/{total_scenes} 个场景")
        
        # 在所有处理完成后，保存包含所有新数据的配置文件
        self.save_updated_config()
        
        return successful_scenes == total_scenes


def main():
    parser = argparse.ArgumentParser(description='批量处理摄像头拍照，按场景分批并重载')
    parser.add_argument('--scene_ids', type=int, nargs='*', 
                      help='要处理的场景ID列表 (默认: 处理所有场景)')
    # 修改了参数名称和帮助文本
    parser.add_argument('--max_concurrent_cameras', type=int, default=50,
                      help='每个批次同时创建和拍照的最大摄像头数量。每批处理完后会重载场景。')
    parser.add_argument('--config_file', type=str, 
                      required=True,
                      help='摄像头配置文件路径')
    parser.add_argument('--base_usd_path', type=str,
                      required=True,
                      help='USD文件基础路径')
    parser.add_argument('--output_path', type=str,
                      required=True,
                      help='输出路径')
    parser.add_argument('--start_index',type=int,default=0,help='起始场景ID索引')
    
    args = parser.parse_args()
    
    print(f"单批次最大摄像头数: {args.max_concurrent_cameras}")
    print(f"配置文件: {args.config_file}")
    processor = CameraBatchProcessor(
        config_file=args.config_file,
        base_usd_path=args.base_usd_path,
        output_base_path=args.output_path,
        max_concurrent_cameras=args.max_concurrent_cameras,
        start_index=args.start_index
    )
    
    if not processor.scenes:
        print("错误: 配置文件中没有找到任何符合条件的场景配置")
        simulation_app.close()
        return
    
    success = processor.process_all_scenes(args.scene_ids)
    
    if success:
        print(f"\n✅ 成功完成所有指定场景的处理")
    else:
        print(f"\n⚠️ 部分或全部场景处理失败")
    
    simulation_app.close()

if __name__ == "__main__": 
    main()