# %%
from datasets import load_dataset
from transformers import AutoTokenizer
import os
import json

MODEL_PATH = "<your_model_name>"

dataset_path = os.path.join(
    os.path.dirname(__file__),
    "..",
    "data",
    "env",
    "trainset_4096.jsonl"
)

save_path = os.path.join(
    os.path.dirname(__file__),
    "..",
    "data",
    "env",
    "trainset_4096_grpo.jsonl"
)

hf_dataset = load_dataset("json", data_files=dataset_path, split="train")
tokenizer = AutoTokenizer.from_pretrained(
    MODEL_PATH, trust_remote_code=True)
# %%
problems = [item['messages'][:-1] for item in hf_dataset]
solutions = [item['messages'][-1]['content'] for item in hf_dataset]

problems = tokenizer.apply_chat_template(
    problems,
    add_generation_prompt=True,
    tokenize=False,
)
# %%
with open(save_path, 'w', encoding='utf-8') as f:
    for problem, solution in zip(problems, solutions):
        item = {
            "problem": problem,
            "solution": solution
        }
        f.write(json.dumps(item, ensure_ascii=False) + "\n")