import json

def read_jsonl(file_path):
    """Load a JSON Lines file into a list of decoded records.

    Lines that are empty or contain only whitespace are skipped. A line that
    is not valid JSON is reported on stdout and skipped; it does not abort
    the read.

    Args:
        file_path: Path of the file to read; passed straight to ``open``.

    Returns:
        A list holding one decoded JSON value per valid line, in file order.

    Raises:
        OSError: Propagated from ``open`` if the file cannot be opened.
    """
    records = []
    # "utf-8-sig" decodes plain UTF-8 exactly like "utf-8" but also strips a
    # leading byte-order mark. With plain "utf-8" the BOM stays glued to the
    # first line, json.loads rejects it, and the first record is lost.
    with open(file_path, 'r', encoding='utf-8-sig') as f:
        for line in f:
            if not line.strip():  # skip blank lines
                continue
            try:
                record = json.loads(line)
            except json.JSONDecodeError as e:
                # Best effort: report the bad line and carry on.
                print(f"解析出错: {e}，内容为: {line}")
            else:
                records.append(record)
    return records

# Sanity-check the SFT dataset: each sample's 'input' must contain both
# '### example 1' and '### example 2', and both '"cot":' and '"code":'.
sft_data = read_jsonl('deduplicated_markdown4_unicode_5k_no_chinese.jsonl')
len_sft = len(sft_data)
# Keys inspected while debugging these samples: 'url', 'id', 'input', 'output'.
# NOTE(review): the printed messages (including the "REEOR" spelling) are kept
# verbatim in case the output is grepped; they do not say which sample failed.
for sft_sample_now in sft_data:
    sft_input = sft_sample_now['input']
    if not ('### example 1' in sft_input and '### example 2' in sft_input):
        print("REEOR1!!!")
    if not ('''"cot":''' in sft_input and '''"code":''' in sft_input):
        print("REEOR2!!!")

# Sanity-check the RL training set: the first prompt message must mention
# 'Input 1', 'Input 2', 'Output 1' and 'Output 2', and the reward model's
# ground truth must expose both a 'code' and an 'id' key.
rl_train_data = read_jsonl('verl_train.jsonl')
len_rl_train = len(rl_train_data)
# Fields inspected while debugging these samples: 'data_source', 'ability',
# 'prompt' (indexed [0], with 'content' and 'role'), and
# 'reward_model' -> 'ground_truth' -> 'code' / 'id'.
# NOTE(review): the printed messages (including the "REEOR" spelling) are kept
# verbatim in case the output is grepped; they do not say which sample failed.
for rl_train_sample_now in rl_train_data:
    prompt_content = rl_train_sample_now['prompt'][0]['content']
    if not all(
        marker in prompt_content
        for marker in ('Input 1', 'Input 2', 'Output 1', 'Output 2')
    ):
        print("REEOR1!!!")
    # Looked up only after the prompt check so a sample without
    # 'reward_model' still reports its prompt problem before raising.
    # .keys() is kept so a non-mapping ground truth fails loudly instead of
    # silently passing a substring test.
    ground_truth_keys = rl_train_sample_now['reward_model']['ground_truth'].keys()
    if not ('code' in ground_truth_keys and 'id' in ground_truth_keys):
        print("REEOR2!!!")