import os
import json

METHOD = "confidence_score"


def extract_scores(root_path):

    for dirpath, dirnames, filenames in os.walk(root_path):
        if 'score.jsonl' in filenames and os.path.basename(dirpath) == 'logp@answer':
            src_file = os.path.join(dirpath, 'score.jsonl')
            target_dir = os.path.join(os.path.dirname(
                dirpath), METHOD)
            os.makedirs(target_dir, exist_ok=True)
            target_file = os.path.join(target_dir, 'score.jsonl')

            scores = []
            with open(src_file, 'r', encoding='utf-8') as f:
                for line in f:
                    line = line.strip()
                    if not line:
                        continue
                    try:
                        data = json.loads(line)
                        if METHOD == 'confidence_score':
                            scores.append(
                                {'score_name': 'confidence_score',
                                 'score': sum(data['logp_list'][:data['answer_start']]) / len(data['logp_list'][:data['answer_start']])+sum(data['logp_list'][data['answer_start']:data['answer_end']])})
                        else:
                            raise ValueError(f"UNKNOWN: {METHOD}")
                    except json.JSONDecodeError as e:
                        print(f"JSON FAIL: {src_file} -> {e}")

            with open(target_file, 'w', encoding='utf-8') as f:
                for item in scores:
                    f.write(json.dumps(item, ensure_ascii=False) + '\n')

            print(f"DONE {src_file} -> {target_file}")


if __name__ == '__main__':
    root_path = '../judge/'
    extract_scores(root_path)
