import os
import datetime
import openpyxl
from openpyxl.styles import PatternFill, Font
import numpy as np
from collections import defaultdict
from tqdm import tqdm
import json
import argparse

def just_open(filename):
    filename = os.path.abspath(filename)  # Excel打开时需要使用绝对路径
    xlApp = Dispatch("Excel.Application")
    xlApp.Visible = False  # 确保Excel应用程序不可见
    xlApp.DisplayAlerts = False  # 关闭所有警告对话框
    xlApp.ScreenUpdating = False  # 禁用屏幕更新
    try:
        xlBook = xlApp.Workbooks.Open(Filename=filename, UpdateLinks=False, ReadOnly=False)
        xlBook.Save()
        xlBook.Close(SaveChanges=True)
    except Exception as e:
        print(f"An error occurred: {e}")
    finally:
        xlApp.Quit()
        
def parse_option():
    parser = argparse.ArgumentParser("command line arguments for evaluation.")
    
    parser.add_argument('--model', type=str, default="multi_gpt-4o-no-df-5-rounds", help='model name')
    parser.add_argument('--dataset', type=str, default="ablation_50", help='dataset name')

    opt = parser.parse_args()

    return opt


def datetime_to_float(dt):
    # Excel dates start from 1899-12-30, which is 0 in Excel (due to a bug, 1900 is considered a leap year in Excel)
    excel_start_date = datetime.datetime(1899, 12, 30)
    delta = dt - excel_start_date
    return delta.days + delta.seconds / 86400.0


def transform_value(v):
    if isinstance(v, (int, float)):
        v = round(float(v), 2)
    elif isinstance(v, datetime.time):
        v = str(v)[:-3]
    elif isinstance(v, datetime.datetime):
        v = round(datetime_to_float(v), 0)
    elif isinstance(v, str):
        try:
            v = round(float(v), 2)
        except ValueError:
            pass
    return v


def compare_cell_value(v1, v2):

    v1 = transform_value(v1)
    v2 = transform_value(v2)
    if (v1 == "" and v2 is None) or (v1 is None and v2 == ""):
        return True
    if (v1 == "" and v2 == "") or (v1 is None and v2 is None):
        return True
    if type(v1) != type(v2):
        # print(type(v1), type(v2))
        return False
    if v1 == v2:
        return True
    else:
        return False


def compare_fill_color(fill1, fill2):
    fgColor1 = fill1.fgColor.rgb if fill1.fgColor else None
    fgColor2 = fill2.fgColor.rgb if fill2.fgColor else None
    bgColor1 = fill1.bgColor.rgb if fill1.bgColor else None
    bgColor2 = fill2.bgColor.rgb if fill2.bgColor else None

    if fgColor1 == fgColor2 and bgColor1 == bgColor2:
        return True
    else:
        return False


def compare_font_color(font_gt, font_proc):
    if font_gt.color is not None and font_proc.color is not None:
        return font_gt.color.rgb == font_proc.color.rgb
    elif font_gt.color is None and font_proc.color is None:
        return True
    else:
        return False


def sheet_level_compare(ws_gt, ws_proc):
    # 比较行数和列数是否相等
    if ws_gt.max_row != ws_proc.max_row or ws_gt.max_column != ws_proc.max_column:
        msg = f"Different dimensions: ws_gt has {ws_gt.max_row} rows and {ws_gt.max_column} columns,\
                while ws_proc has {ws_proc.max_row} rows and {ws_proc.max_column} columns."
        return False, msg

    # 遍历所有单元格，比较值和格式
    for row in range(1, ws_proc.max_row + 1):
        for col in range(1, ws_proc.max_column + 1):
            cell_gt = ws_gt.cell(row=row, column=col)
            cell_proc = ws_proc.cell(row=row, column=col)
            
            # 比较单元格值
            if compare_cell_value(cell_gt.value, cell_proc.value):
                msg = f"Value difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.value},\
                      ws_proc has {cell_proc.value}"
                return False, msg
            
            # # 比较单元格填充颜色
            # if not compare_fill_color(cell_gt.fill, cell_proc.fill):
            #     msg = f"Fill color difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.fill.fgColor.rgb},\
            #            ws_proc has {cell_proc.fill.fgColor.rgb}"
            #     return False, msg

            # # 比较单元格字体颜色
            # if not compare_font_color(cell_gt.font, cell_proc.font):
            #     # msg = f"Font color difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.font.color.rgb},\
            #     #        ws_proc has {cell_proc.font.color.rgb}"
            #     msg = f"Font color difference at cell {cell_gt.coordinate}"
            #     return False, msg
            
    print("Sheets are identical.")
    return True, ""


def col_num2name(n):
    """ Convert a column number to an Excel column name """
    name = ''
    while n > 0:
        n, remainder = divmod(n - 1, 26)
        name = chr(65 + remainder) + name
    return name


def col_name2num(name):
    """ Convert an Excel column name to a column number """
    num = 0
    for c in name:
        num = num * 26 + (ord(c) - ord('A') + 1)
    return num


def parse_cell_range(range_str):
    """ Parse a range string like 'A1:AB12' """
    start_cell, end_cell = range_str.split(':')
    start_col, start_row = '', ''
    for char in start_cell:
        if char.isdigit():
            start_row += char
        else:
            start_col += char
    
    end_col, end_row = '', ''
    for char in end_cell:
        if char.isdigit():
            end_row += char
        else:
            end_col += char

    return (col_name2num(start_col), int(start_row)), (col_name2num(end_col), int(end_row))


def generate_cell_names(range_str):
    """ Generate a list of all cell names in the specified range """
    if ':' not in range_str:
        return [range_str]
    (start_col, start_row), (end_col, end_row) = parse_cell_range(range_str)
    columns = [col_num2name(i) for i in range(start_col, end_col + 1)]
    cell_names = [f"{col}{row}" for col in columns for row in range(start_row, end_row + 1)]
    return cell_names


def cell_level_compare(wb_gt, wb_proc, sheet_name, cell_range , is_CF):
    if sheet_name not in wb_proc:
        return False, "worksheet not found"
    ws_gt = wb_gt[sheet_name]
    ws_proc = wb_proc[sheet_name]

    # 解析单元格范围
    cell_names = generate_cell_names(cell_range)

    # 遍历指定范围内的单元格，比较值
    for cell_name in cell_names:
        cell_gt = ws_gt[cell_name]
        cell_proc = ws_proc[cell_name]

        # 比较单元格值
        if not compare_cell_value(cell_gt.value, cell_proc.value):
            msg = f"Value difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.value},\
                    ws_proc has {cell_proc.value}"
            return False, msg
        
        if is_CF:
            # 比较单元格填充颜色
            if not compare_fill_color(cell_gt.fill, cell_proc.fill):
                msg = f"Fill color difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.fill.fgColor.rgb},\
                        ws_proc has {cell_proc.fill.fgColor.rgb}"
                return False, msg

            # 比较单元格字体颜色
            if not compare_font_color(cell_gt.font, cell_proc.font):
                # msg = f"Font color difference at cell {cell_gt.coordinate}: ws_gt has {cell_gt.font.color.rgb},\
                #        ws_proc has {cell_proc.font.color.rgb}"
                msg = f"Font color difference at cell {cell_gt.coordinate}"
                return False, msg

    print("Cell values in the specified range are identical.")
    return True, ""


def compare_workbooks(gt_file, proc_file, instruction_type, answer_position):
    if not os.path.exists(proc_file):
        return False, "File not exist"
    # Open workbooks
    if "CF" in proc_file:
        is_CF = True
    else:
        is_CF = False
    try:
        # just_open(wb_proc)
        wb_gt = openpyxl.load_workbook(filename=gt_file, data_only=True)
        wb_proc = openpyxl.load_workbook(filename=proc_file, data_only=True)
    except Exception as e:
        return False, str(e)

    # Initialize report
    result = False
    msg = ""

    sheet_cell_ranges = answer_position.split(',')
    for sheet_cell_range in sheet_cell_ranges:
        if '!' in sheet_cell_range:
            sheet_name, cell_range = sheet_cell_range.split('!')
            sheet_name = sheet_name.lstrip("'").rstrip("'")
        else:
            sheet_name = wb_gt.sheetnames[0]
            cell_range = sheet_cell_range
    result, msg = cell_level_compare(wb_gt, wb_proc, sheet_name, cell_range , is_CF)

    return result, msg


if __name__ == "__main__":
    opt = parse_option()

    with open(f'{opt.dataset}/dataset.json', 'r') as fp:
        dataset = json.load(fp)

    eval_results = []
    for data in tqdm(dataset):
        test_case_results = []
        suffix = 'xlsx'
        for test_case_idx in range(3):
            gt_path = f"{opt.dataset}/spreadsheet/{data['id']}/{test_case_idx + 1}_{data['id']}_answer.{suffix}"
            proc_path = f"{opt.dataset}/outputs/{opt.model}/{test_case_idx + 1}_{data['id']}_output.{suffix}"
            try:
                result, message = compare_workbooks(gt_path, proc_path, data['instruction_type'], data['answer_position'])
            except:
                result = 0
            test_case_results.append(int(result))
        soft_restriction = test_case_results.count(1) / len(test_case_results)
        hard_restriction = 0 if 0 in test_case_results else 1
        eval_results.append({
            'id': data['id'],
            'instruction_type': data['instruction_type'],
            'test_case_results': test_case_results,
            'soft_restriction': soft_restriction,
            'hard_restriction': hard_restriction,
        })
    
    with open(f'{opt.dataset}/outputs/eval_{opt.model}.json', 'w') as fp:
        json.dump(eval_results, fp, indent=4)
