import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

df_original = pd.read_csv('document/basic_understanding/all_scores_original.csv')
df_modified = pd.read_csv('document/basic_understanding/all_scores_modified.csv')

plt.rcParams['font.family'] = 'avenir'
plt.rcParams['font.weight'] = 'bold'


fig, axes = plt.subplots(1, 3, figsize=(20, 6))
difficulties = ['easy', 'medium', 'hard']
colors = ['#83c5be', '#006d77'] 

for idx, difficulty in enumerate(difficulties):
    orig_data = df_original[df_original['Difficulty'] == difficulty]
    mod_data = df_modified[df_modified['Difficulty'] == difficulty]
    
    x = np.arange(len(orig_data['Model']))
    width = 0.4
    
    bars1 = axes[idx].bar(x - width/2, orig_data['Objective Score'], width, 
                          label='w/o adjustment', color=colors[0], alpha=0.8)
    bars2 = axes[idx].bar(x + width/2, mod_data[mod_data.columns[2]], width, 
                          label='w/ adjustment', color=colors[1], alpha=0.8)
    
    axes[idx].set_title(f'{difficulty.capitalize()} Difficulty', pad=20, fontsize=17)
    axes[idx].set_xticks(x)
    axes[idx].set_xticklabels(orig_data['Model'], rotation=30, ha='right', fontsize=14)
    axes[idx].grid(True, linestyle='--', alpha=0.3)
    axes[idx].yaxis.grid(True, linestyle='--', alpha=0.7) 
    
    if idx == 0:
        axes[idx].set_ylabel('Score')
    else:
        axes[idx].tick_params(labelleft=False)
    
    axes[idx].tick_params(axis='y', labelsize=18)

handles, labels = axes[0].get_legend_handles_labels()
fig.legend(handles, labels, loc='upper center', ncol=2, fontsize=15)


plt.tight_layout()
# fig.suptitle('Comparison of Original vs Modified Scores by Difficulty Level', 
            #  y=1.05, fontsize=14, fontweight='bold')

plt.subplots_adjust(top=0.829, bottom=0.43, right=0.993, left=0.032, wspace=0.1)  # 增加水平间距并调整顶部间距

plt.savefig('answer_leakage.pdf', bbox_inches='tight', dpi=500)
# plt.show()