"""Rename the entries of the ImageNet training directory using a JSON mapping.

Each entry directly under the training root whose stem is a key in
``imagenet_classes.txt`` is renamed to the mapped value; entries without a
mapping are printed and left in place.
"""
import os

# Deliberately assigned before `huggingface_hub` is imported below --
# presumably the library reads this flag at import time to enable
# hf_transfer-backed downloads (TODO confirm). Keep it above that import;
# an import sorter must not move it.
os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
import json
from pathlib import Path

# NOTE: in the visible part of this file, `snapshot_download` is only
# referenced by the commented-out download step further down.
from huggingface_hub import snapshot_download
from tqdm import tqdm

# Directory whose direct children get renamed. The path is relative to the
# current working directory, not to this file. It is created together with
# any missing parents, and an already existing directory is not an error.
root = Path("../../../data/vq/imagenet/train")
root.mkdir(parents=True, exist_ok=True)

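# One-time download step, kept for reference. To fetch the
# "ILSVRC/imagenet-1k" dataset repository into `root`, uncomment the call and
# the `exit()` below, run the script once, then comment them out again so the
# script continues to the renaming pass.
# snapshot_download(
#     repo_id="ILSVRC/imagenet-1k", repo_type="dataset", local_dir=str(root)
# )

# exit()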


# Load the stem -> new-name mapping. Despite the .txt extension the file is
# parsed as JSON; it is expected to hold a JSON object, because it is used
# below for `in` membership tests and key lookups. The path is relative to
# the current working directory.
with open("./imagenet_classes.txt", encoding="utf-8") as f:
    dt = json.load(f)


# Take a snapshot of the listing before renaming anything, so the loop never
# iterates a directory it is modifying. Sorting makes the processing order
# (and therefore which entry wins when two keys map to the same name)
# deterministic, and a sized list lets tqdm display a total.
entries = sorted(root.glob("*"))

for p in tqdm(entries):
    # The stem drops the last suffix, so "abc.ext" is looked up as "abc".
    # NOTE(review): the suffix is not re-attached to the new name -- this
    # looks intended for suffix-less directories; confirm if files are renamed.
    key = p.stem
    if key not in dt:
        # No mapping for this entry: report its stem and leave it untouched.
        # tqdm.write prints to stdout without corrupting the progress bar.
        tqdm.write(key)
        continue
    name = dt[key]
    target = p.parent / name
    if target == p:
        # Already carries the mapped name; nothing to do.
        continue
    if target.exists():
        # Renaming onto an existing path would either silently replace it or
        # raise part-way through the run (platform dependent), so report the
        # collision and keep both entries as they are.
        tqdm.write(f"skip {p.name}: {target} already exists")
        continue
    p.rename(target)
print("done")
