import datasets
from scripts.utils import load_single_dataset, save_dataset


def process_row(row):
    """Add chat-style ``messages`` and a signed ``score`` to *row* in place.

    The first two entries of ``row["conversations"]`` are read via their
    ``"value"`` field and stored as a user turn followed by an assistant
    turn. ``row["score"]`` becomes ``1`` when ``row["kto_tag"]`` is truthy
    and ``-1`` otherwise.

    The same ``row`` object is mutated and returned; the ``conversations``
    and ``kto_tag`` entries are left untouched here.
    """
    # Only the first two turns are used; any further turns are ignored.
    user_text = row["conversations"][0]["value"]
    assistant_text = row["conversations"][1]["value"]

    chat = []
    chat.append({"role": "user", "content": user_text})
    chat.append({"role": "assistant", "content": assistant_text})
    row["messages"] = chat

    # Collapse the tag's truthiness into a +1 / -1 label.
    if row["kto_tag"]:
        row["score"] = 1
    else:
        row["score"] = -1
    return row


# Conversion pipeline: load the scored dataset, add `messages` / `score` to
# every row via process_row, drop the two source columns that process_row
# read from, and write the result next to the input with an `_rc` suffix.
# NOTE(review): the paths start with `~`; whether it is expanded depends on
# load_single_dataset / save_dataset in scripts.utils — confirm.
ds = (
    load_single_dataset(
        "~/LLaMA-Factory-250514/data/qwen3sft_train10_responses01234567_scored_valid.json"
    )
    # num_proc=64 is forwarded to map() unchanged.
    .map(process_row, num_proc=64)
    .remove_columns(["kto_tag", "conversations"])
)
save_dataset(
    ds,
    "~/LLaMA-Factory-250514/data/qwen3sft_train10_responses01234567_scored_valid_rc.json",
)
