
import jsonlines

# Sanity check: compare the 'unclear_task' flag of each evaluated record
# (stored under its 'metadata' dict) with the flag of the positionally
# matching source record. On the first disagreement, print both records and
# stop the script.
EVALUATED_PATH = 'Task_1/math_500_parsed_information_missing_all_r1_non_cls_thoughts_evaluated_s1_answer_evaluated.jsonl'
SOURCE_PATH = 'Task_1/math_500_parsed_information_missing_all_r1_non_cls_data.jsonl'

# Use context managers so both readers are closed as soon as the records are
# loaded, instead of leaving the file handles open until interpreter exit.
with jsonlines.open(EVALUATED_PATH) as reader:
    data_1 = list(reader)
with jsonlines.open(SOURCE_PATH) as reader:
    data_2 = list(reader)

# Keep only source records whose 'thought' text splits into at least four
# chunks on blank lines ('\n\n').
# NOTE(review): presumably this mirrors the filter used when the evaluated
# file was produced, so that the two lists line up by position -- confirm.
data_2 = [item for item in data_2 if len(item['thought'].split('\n\n')) >= 4]

# NOTE(review): zip() stops at the shorter list, so a length mismatch between
# data_1 and data_2 is not reported by this loop.
for item_1, item_2 in zip(data_1, data_2):
    if item_1['metadata']['unclear_task'] != item_2['unclear_task']:
        print(item_1)
        print(item_2)
        # Same exit status as the bare exit() helper (0), but does not rely
        # on the `site` module having injected exit() into builtins.
        raise SystemExit
