import torch, os, json, tqdm

class Ego4D:
    def __init__(self, vision_pretrained: str, embed_mark: str, frame_fps: int, local_debug: bool, **kwargs):
        super().__init__(**kwargs)
        if local_debug:
            self.root = ""
            self.video_root = os.path.join(self.root, 'full_scale')
            self.anno_root = os.path.join(self.root, 'annotations')
        else:
            self.root = ""
            self.video_root = ""
            self.anno_root = os.path.join(self.root, 'annotations')
        self.embed_dir = f"{self.video_root}_{embed_mark}_{vision_pretrained.replace('/', '--')}"
        self.frame_fps = frame_fps
        self.local_debug = local_debug
        self.metadata = self.get_metadata() if not local_debug else None
        self.annos: list[dict]

    def __len__(self):
        return len(self.annos)

    def get_metadata(self, ):
        metadata_path = f'{self.embed_dir}_metadata.json'
        if os.path.exists(metadata_path):
            print(f'load {metadata_path}...')
            metadata = json.load(open(metadata_path))
        else:
            metadata = {}
            for file in tqdm.tqdm(os.listdir(self.embed_dir), desc=f'prepare {metadata_path}...'):
                path = os.path.join(self.embed_dir, file)
                duration = (len(torch.load(path)) - 1) / self.frame_fps  # in seconds
                key = os.path.splitext(os.path.basename(path))[0]
                metadata[key] = {'duration': duration, 'path': path}
            json.dump(metadata, open(metadata_path, 'w'), indent=4)
        return metadata
