import pandas as pd
import matplotlib.pyplot as plt
import os

df = pd.read_csv('output_data/bild_finetuning_results-sept29-10pm.csv')

print(df.columns)


numeric_columns = ['alpha_rb', 'avg_confidence', 'large_token_proportion', 'small_token_proportion', 'quality_score']
df_numeric = df[numeric_columns]

# Group the data by alpha_rb and take the mean of the numeric columns
df_grouped = df_numeric.groupby('alpha_rb').mean()

alpha_rb = df_grouped.index
avg_confidence = df_grouped['avg_confidence']
large_token_proportion = df_grouped['large_token_proportion']
small_token_proportion = df_grouped['small_token_proportion']
quality_score = df_grouped['quality_score']

if not os.path.exists('graphs'):
    os.makedirs('graphs')

# avg_confidence vs alpha_rb
plt.figure()
plt.plot(alpha_rb, avg_confidence, marker='o', color='b')
plt.title('alpha_rb vs avg_confidence (Averaged)')
plt.xlabel('alpha_rb')
plt.ylabel('avg_confidence')
plt.savefig('graphs/alpha_rb_vs_avg_confidence_avg.png')
plt.close()  # Close the figure after saving

# large_token_proportion vs alpha_rb
plt.figure()
plt.plot(alpha_rb, large_token_proportion, marker='o', color='g')
plt.title('alpha_rb vs large_token_proportion (Averaged)')
plt.xlabel('alpha_rb')
plt.ylabel('large_token_proportion')
plt.savefig('graphs/alpha_rb_vs_large_token_proportion_avg.png')
plt.close()

# small_token_proportion vs alpha_rb
plt.figure()
plt.plot(alpha_rb, small_token_proportion, marker='o', color='r')
plt.title('alpha_rb vs small_token_proportion (Averaged)')
plt.xlabel('alpha_rb')
plt.ylabel('small_token_proportion')
plt.savefig('graphs/alpha_rb_vs_small_token_proportion_avg.png')
plt.close()

# quality_score vs alpha_rb
plt.figure()
plt.plot(alpha_rb, quality_score, marker='o', color='m')
plt.title('alpha_rb vs quality_score (Averaged)')
plt.xlabel('alpha_rb')
plt.ylabel('quality_score')
plt.savefig('graphs/alpha_rb_vs_quality_score_avg.png')
plt.close()

print("Averaged plots have been saved in the 'graphs' folder.")
