import pandas as pd
import matplotlib.pyplot as plt

# Report how often each value of the "mask_pattern" column occurs in the test
# set CSV, then draw the counts as an annotated bar chart that is saved to disk
# and shown on screen.

# Input CSV, the column to summarize, and the image the chart is written to.
CSV_PATH = 'dataset_segno/ver3/data_domain_ver3_maskNone_L/testset_maskmix.csv'
MASK_COLUMN = "mask_pattern"
OUTPUT_PATH = "mask_distribution_improved.png"

df = pd.read_csv(CSV_PATH)

print("List of column names:")
print(df.columns)

if MASK_COLUMN not in df.columns:
    print("The specified 'mask_pattern' column was not found. Please check the column names.")
else:
    # value_counts() ignores missing values and sorts by descending frequency,
    # so the bars appear from most to least common pattern.
    mask_distribution = df[MASK_COLUMN].value_counts()

    print("\nDistribution of mask patterns:")
    print(mask_distribution)

    if mask_distribution.empty:
        # A column with no usable values yields an empty Series; asking pandas
        # for a bar chart of it fails with an opaque error, so report the
        # situation explicitly and skip plotting.
        print("No mask pattern values to plot; skipping the chart.")
    else:
        plt.style.use('ggplot')

        # Create the figure and axes explicitly and hand the axes to pandas so
        # the chart never depends on whichever figure happens to be "current".
        fig, ax = plt.subplots(figsize=(10, 6), dpi=100)
        mask_distribution.plot(kind="bar", ax=ax, edgecolor='black')

        ax.set_xlabel("Mask Pattern", fontsize=14)
        ax.set_ylabel("Frequency", fontsize=14)
        ax.set_title("Distribution of Mask Patterns", fontsize=16, fontweight='bold')

        ax.grid(True, which='both', linestyle='--', linewidth=0.5, alpha=0.7)

        # These act on the current axes, which is the one created above.
        plt.xticks(rotation=45, ha='right', fontsize=12)
        plt.yticks(fontsize=12)

        # Write each bar's count just above its top edge, centered on the bar.
        for bar in ax.patches:
            count = bar.get_height()
            ax.annotate(
                f'{int(count)}',
                (bar.get_x() + bar.get_width() / 2, count),
                ha='center',
                va='bottom',
                fontsize=12,
                xytext=(0, 5),
                textcoords='offset points',
            )

        fig.tight_layout()

        # Save before show(): some backends discard the figure once the
        # window is closed, which would leave an empty image on disk.
        fig.savefig(OUTPUT_PATH)
        plt.show()