
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

# --------- 1.  load validation CSV ---------
df = pd.read_csv(
    r"C:/research",
    header=None, engine="c"
)

IDX_CORRECT = 0      # 1 = correct, 0 = incorrect
IDX_CLASS   = 1      # class-id  (0‥195)
IDX_SOFTMAX = 3     # top-softmax score

# --------- 2.  keep only correct predictions ----------
df_corr = df[df[IDX_CORRECT] == 1]

# --------- 3.  per-class mean ± std of softmax --------
gp       = df_corr.groupby(IDX_CLASS)[IDX_SOFTMAX]
mean_sm  = gp.mean()
std_sm   = gp.std().fillna(0.0)        # classes seen once → std = 0

# ensure every of the 196 ids appears on the x-axis
all_ids  = pd.RangeIndex(196)
mean_sm  = mean_sm.reindex(all_ids)
std_sm   = std_sm .reindex(all_ids).fillna(0.0)

# --------- 4.  scatter + error bars plot ---------------
plt.figure(figsize=(12, 3))
plt.errorbar(
    mean_sm.index, mean_sm,
    yerr=std_sm,
    fmt="o", markersize=6,
    elinewidth=0.7, capsize=3
)



plt.xlabel("Class ID (0–195)", fontsize=18)
plt.ylabel("Mean soft-max (correct predictions)", fontsize=18)
plt.title("Stanford Cars – per-class confidence of correct predictions",
          fontsize=21, pad=12)



plt.tight_layout()
plt.show()



















