#!/usr/bin/env python

import argparse
from transformers import AutoTokenizer
import os
import torch

def download_and_save_tokenizer(
    model_id: str,
    save_directory: str,
    *,
    trust_remote_code: bool = True,
) -> None:
    """Download the tokenizer for *model_id* and save it in *save_directory*.

    Args:
        model_id: Model identifier passed to ``AutoTokenizer.from_pretrained``
            (e.g. ``facebook/opt-125m``).
        save_directory: Directory the tokenizer files are written to. It is
            created (including parents) if it does not exist yet.
        trust_remote_code: Forwarded to ``AutoTokenizer.from_pretrained``.
            Defaults to ``True`` to keep the script's existing behaviour.

    Any exception raised while creating the directory, loading the tokenizer
    or saving it propagates to the caller unchanged.
    """
    # Create the target directory first so an unusable path fails before any
    # download is attempted.
    os.makedirs(save_directory, exist_ok=True)

    print(f"Downloading tokenizer for {model_id}...")
    # SECURITY NOTE: trust_remote_code=True allows custom Python code shipped
    # in the model repository to run on this machine. Pass
    # trust_remote_code=False for model ids you do not fully trust.
    tokenizer = AutoTokenizer.from_pretrained(
        model_id, trust_remote_code=trust_remote_code
    )

    print("Saving tokenizer...")
    tokenizer.save_pretrained(save_directory)

    print(f"Tokenizer has been saved to: {save_directory}")

def main(argv=None) -> None:
    """Parse command-line arguments and download/save the requested tokenizer.

    Args:
        argv: Optional list of argument strings to parse. When ``None``
            (the default), argparse reads the arguments from ``sys.argv``.

    Both ``--model_id`` and ``--save_dir`` are mandatory; if either is
    missing argparse prints a usage message and exits with status 2.
    """
    parser = argparse.ArgumentParser(
        description="Download and save a Hugging Face tokenizer."
    )
    # Both options are required: without them the download step would be
    # handed ``None`` and fail with an unrelated-looking error.
    parser.add_argument(
        "--model_id",
        type=str,
        required=True,
        help="The model identifier (e.g., facebook/opt-125m)",
    )
    parser.add_argument(
        "--save_dir",
        type=str,
        required=True,
        help="The save directory",
    )
    args = parser.parse_args(argv)

    download_and_save_tokenizer(args.model_id, args.save_dir)

# Run the command-line entry point only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == "__main__":
    main()
