import json
import glob
import os
import shutil
import matplotlib.pyplot as plt

test_model = 'llm'
check_folder = f'result/valresult/{test_model}'
success_list = []
skipNotSure = False

threshold_pass = 0
threshold_fail = 1

cannotjudge = 0

file_error = 0
video_error = 0

subquestion_true_num = 0
subquestion_false_num = 0


subquestion_tt = 0
subquestion_ff = 0
subquestion_tf = 0
subquestion_ft = 0

subquestion_notsure = 0

right_arr = []
save_arr = []
notsure_arr = []
for i in range(443):
    folder_id = i // 2500
    if not os.path.exists(f'{check_folder}/batch_{folder_id}/video_{i}'):
        continue
    for j in range(8):
        json_path = f'{check_folder}/batch_0/video_{i}/video_{i}_{j}_0.json'
        if not os.path.exists(json_path):
            continue

        gt_video = False
        judge_video = False
        
        # if os.path.exists(f'download_labeled/video_{i}/video_{i}_{j}.mp4'):
        #     gt_video = True
        gt_video = True

        notsure = False
        with open(json_path, "r", encoding="utf-8") as f:
            data = json.load(f)
        if not isinstance(data['vlm_result'], (dict, list)):
            video_error += 1
            continue

        vlm_result = data['vlm_result']
        weight = data['weight']
        score = 0
        notsure_single_num = 0
        for k in range(len(vlm_result)):
            if isinstance(vlm_result[k], str):
                file_error += 1
                continue
            if 'sure' in vlm_result[k]['result']:
                notsure_single_num += 1
            
            if skipNotSure and 'sure' in vlm_result[k]['result']:
                notsure = True
                subquestion_notsure += 1
                break
            if vlm_result[k]['result'] != 'True':
                
                if 'sure' in vlm_result[k]['result'] and int(vlm_result[k]['confidence_score']) < 4:
                    continue

                if False and 'sure' in vlm_result[k]['result'] and int(vlm_result[k]['confidence_score']) < 3:
                    pass
                else:
                    score += 1
        if notsure_single_num > 4:
            score += 1
        notsure_arr.append(notsure_single_num)
        if not skipNotSure or not notsure: 
            if score > threshold_pass and score < threshold_fail:
                cannotjudge += 1
                continue
            right_arr.append(f'video_{i}_{j}.mp4')
            if score <= threshold_pass:
                judge_video = True
                success_list.append(f'video_{i}')
            if score >= threshold_fail:
                judge_video = False

            if judge_video and gt_video:
                subquestion_tt += 1
            elif not judge_video and not gt_video:
                subquestion_ff += 1
            elif judge_video and not gt_video:
                subquestion_tf += 1
            elif not judge_video and gt_video:
                subquestion_ft += 1
        
            if gt_video:
                subquestion_true_num += 1
            else:
                subquestion_false_num += 1


print(f'{test_model}: file_error: {file_error}', f'video_error: {video_error}')
print('--------------------------------')
print(f'SubQuestion: pass: {subquestion_tt}/{subquestion_true_num}, fail: {subquestion_ff}/{subquestion_false_num}, notsure: {subquestion_notsure}, true/false: {subquestion_tf}, false/true:{subquestion_ft}, cannotjudge: {cannotjudge}')
    
    
