#!/usr/bin/env python3
# -*- coding: utf-8 -*-

import argparse
import json
from scripts.utils import load_single_dataset,save_dataset


def main():
    """Command-line entry point: swap a dataset's "scores" column for a JSON list.

    Reads three required options (``--dataset_json``, ``--list_json`` and
    ``--output``), loads the dataset through ``load_single_dataset``, reads the
    replacement values from the JSON file, drops the existing "scores" column,
    adds the loaded values back under the same name, and writes the result
    through ``save_dataset``.

    The JSON payload is passed on without validation; the caller is expected
    to supply one entry per dataset row (not checked here).
    """
    # (flag, help text) pairs; every option is mandatory.
    option_specs = (
        ("--dataset_json", "Path to HF dataset json file"),
        ("--list_json", "Path to json file storing a list"),
        ("--output", "Output path to save the new dataset"),
    )

    cli = argparse.ArgumentParser(
        description="Replace Dataset column 'scores' with a list loaded from a JSON file."
    )
    for flag, help_text in option_specs:
        cli.add_argument(flag, required=True, help=help_text)
    opts = cli.parse_args()

    # Step 1: the dataset must be loaded with the project helper.
    dataset = load_single_dataset(opts.dataset_json)

    # Step 2: read the replacement values.
    with open(opts.list_json, encoding="utf-8") as handle:
        replacement_scores = json.load(handle)

    # Swap the column: drop the old "scores", then attach the new values.
    without_scores = dataset.remove_columns("scores")
    updated = without_scores.add_column("scores", replacement_scores)

    # Step 3: the dataset must be saved with the project helper.
    save_dataset(updated, opts.output)


# Run the CLI only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()

