import os
import json
import argparse


def get_splits_paths(dataset_path):
    # Get the names of all subfolders in the given folder
    im_path = os.path.join(dataset_path, "images")
    pc_path = dataset_path
    splits = ["Training", "Validation"]
    split_path = os.path.join(dataset_path, "splits")
    os.makedirs(split_path, exist_ok=True)
    for split in splits:
        im_split_path = os.path.join(im_path, split)
        pc_split_path = os.path.join(pc_path, split).replace(
            dataset_path, "data/arkitscenes"
        )
        split_names = [f.name for f in os.scandir(im_split_path) if f.is_dir()]
        split_dict = {}
        for name in split_names:
            im_split_name_path = os.path.join(im_split_path, name, "color")
            co_split_name_path = os.path.join(im_split_path, name, "correspondence")
            png_files = [
                f for f in os.listdir(im_split_name_path) if f.endswith(".png")
            ]
            png_files = sorted(png_files, key=lambda x: float(x.split("_")[1][:-4]))
            co_files = [f for f in os.listdir(co_split_name_path) if f.endswith(".npy")]
            co_files = sorted(co_files, key=lambda x: float(x[:-4]))
            # Get the full paths of the .png files
            png_file_paths = [
                os.path.join(im_split_name_path, f).replace(
                    dataset_path, "data/arkitscenes"
                )
                for f in png_files
            ]
            co_file_paths = [
                os.path.join(co_split_name_path, f).replace(
                    dataset_path, "data/arkitscenes"
                )
                for f in co_files
            ]
            for i in range(0, len(png_file_paths), 4):
                split_dict[f"{name}_{i//4}"] = {}
                split_dict[f"{name}_{i//4}"]["pointclouds"] = os.path.join(
                    pc_split_path, name
                )
                split_dict[f"{name}_{i//4}"]["images"] = png_file_paths[i : i + 4]
                split_dict[f"{name}_{i//4}"]["correspondences"] = co_file_paths[
                    i : i + 4
                ]
        with open(os.path.join(split_path, f"{split}.json"), "w") as f:
            json.dump(split_dict, f, indent=4)


# Example usage
if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--dataset_root",
        required=True,
        help="Path to the arkitscenes dataset containing scene folders",
    )
    config = parser.parse_args()
    get_splits_paths(config.dataset_root)
