import jsonlines



# Path templates for the evaluated Task 1 result files (JSON Lines).
# Every template carries two positional `{}` slots that are filled with
# str.format(): first the analysis type string, then the model name.
# The digit in each variable name matches the `thought_1` / `thought_2`
# part of the file name.
file1_omni = (
    "Task_1_analysis/"
    "omni_math_{}_{}_non_cls_thought_1_evaluated.jsonl"
)
file2_omni = (
    "Task_1_analysis/"
    "omni_math_{}_{}_non_cls_thought_2_evaluated.jsonl"
)
file1_math = (
    "Task_1_analysis/"
    "math_500_{}_{}_non_cls_thought_1_evaluated.jsonl"
)
file2_math = (
    "Task_1_analysis/"
    "math_500_{}_{}_non_cls_thought_2_evaluated.jsonl"
)
# Variant template with an extra `basic_` segment (currently unused):
#   'Task_1_analysis/math_500_{}_basic_{}_non_cls_thought_2_evaluated.jsonl'

# Analysis type inserted into the first `{}` slot of the path templates.
# Named ANALYSIS_TYPE rather than `type` so the builtin is not shadowed.
ANALYSIS_TYPE = 'information_missing_level1'

# Model tags inserted into the second `{}` slot; one ratio is printed per tag.
# Alternative tag that can be swapped in: 'qwen38b_type4_sft'.
MODELS = ('r1', 'qwen_thinking')


def load_records(path):
    """Read every record of the JSON Lines file at *path* into a list.

    The reader is used as a context manager so the underlying file handle
    is closed as soon as the records have been read.
    """
    with jsonlines.open(path) as reader:
        return list(reader)


def passed_tasks(records):
    """Return the set of ``task`` values whose record has a truthy ``judge_res``.

    NOTE(review): presumably a truthy ``judge_res`` marks a record that the
    evaluator accepted -- confirm against the evaluation script.
    """
    return {record['task'] for record in records if record['judge_res']}


def union_pass_rate(records_1, records_2):
    """Return the share of tasks that pass in at least one of two runs.

    The numerator is the number of distinct ``task`` values with a truthy
    ``judge_res`` in *records_1* or *records_2*; the denominator is the
    number of records in *records_1*.  Returns ``0.0`` when *records_1* is
    empty instead of raising ``ZeroDivisionError``.

    NOTE(review): dividing by ``len(records_1)`` assumes each task appears
    exactly once in the first file and that both files cover the same
    tasks -- confirm.
    """
    if not records_1:
        return 0.0
    passed_either = passed_tasks(records_1) | passed_tasks(records_2)
    return len(passed_either) / len(records_1)


def main():
    """Print the union pass rate on the math_500 files for every model."""
    for model in MODELS:
        records_1 = load_records(file1_math.format(ANALYSIS_TYPE, model))
        records_2 = load_records(file2_math.format(ANALYSIS_TYPE, model))
        # Label each ratio: the loop now runs for every model (the original
        # called exit() after the first iteration), so a bare number would
        # be ambiguous.
        print(f'{model}: {union_pass_rate(records_1, records_2)}')


if __name__ == '__main__':
    main()
