\begin{tikzpicture}[baseline]

\pgfplotstableread[col sep=comma]{./data/ood_label_metrics.csv}{\datatable};
\begin{axis}[
width=\columnwidth,
height=.7\columnwidth,
% ylabel={NLL},
% xlabel={},
title={Normalized NLL ($\downarrow$)},
ymax=0.7,
legend style={font=\tiny, 
	fill opacity=0.6, text opacity =1,
        at={(0.02, 0.98)},anchor=north west,
        row sep=-3pt,
        },
legend cell align={left},
% ytick={0, 0.08}, % Define the desired y tick positions
xtick={0, 1,2,3,4}, % Define the desired y tick positions
xticklabels={ID, OOD-1, OOD-2, OOD-3, OOD-4},
yticklabel style={
	% /pgf/number format/fixed, % Use fixed point notation
	% /pgf/number format/precision=2, % Set the number of decimal places
	% /pgf/number format/fixed zerofill, % Fill in trailing zeros
        },
% ymode=log,
]

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% GP-RBF
\addplot+ [lightgreen, mark=*, 
mark options={solid},
thick,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_RBF_NLPD_mean,y error=GP_RBF_NLPD_std] {\datatable};

% GP-Laplace
\addplot+ [darkgreen, mark=*, 
mark options={solid},
thick,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_Laplace_NLPD_mean,y error=GP_Laplace_NLPD_std] {\datatable};

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Deep Kernel Learning
\addplot+ [gold, mark=*, 
mark options={solid},
thick,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_deepKL_RBF_NLPD_mean,y error=GP_deepKL_RBF_NLPD_std] {\datatable};

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% GP-ARD-RBF
\addplot+ [lightblue, mark=*, 
mark options={solid},
thick,
dotted,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_ARD_RBF_NLPD_mean,y error=GP_ARD_RBF_NLPD_std] {\datatable};

% GP-ARD-Laplace
\addplot+ [darkblue, mark=*, 
mark options={solid},
thick,
dotted,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_ARD_Laplace_NLPD_mean,y error=GP_ARD_Laplace_NLPD_std] {\datatable};

% GP-ARD-Laplace-full
\addplot+ [purple, mark=*, 
mark options={solid},
thick,
dotted,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_ARD_Laplace_full_NLPD_mean,y error=GP_ARD_Laplace_full_NLPD_std] {\datatable};
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% RFM
\addplot+ [black, mark=*, 
mark options={solid},
thick,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_RFM_Laplace_NLPD_mean,y error=GP_RFM_Laplace_NLPD_std] {\datatable};


% RFM-diag
\addplot+ [blackgray, mark=*, 
mark options={solid},
thick,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=GP_RFM_Laplace_diag_NLPD_mean,y error=GP_RFM_Laplace_diag_NLPD_std] {\datatable};

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NG-Boost
\addplot+ [orange, mark=*, 
mark options={solid},
thick,
dashed,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=NG_Boost_NLPD_mean,y error=GP_RFM_Laplace_NLPD_std] {\datatable};


% Cat-Boost-Ensemble
\addplot+ [red, mark=*, 
mark options={solid},
thick,
dashed,
error bars/.cd,
x dir=both,x explicit,
y dir=both,y explicit,
error bar style={solid}
]
table[x=test_level,y=Cat_Boost_Ensemble_NLPD_mean,y error=Cat_Boost_Ensemble_NLPD_std] {\datatable};



% \legend{
%     {GP-RBF},
%     {GP-Laplace},
%     {GP-ARD-RBF},
%     {GP-ARD-Laplace},
%     {GP-RFM-Laplace}, 
%     {NGBoost},
%     {CatBoost-Ensemble}
% }

\end{axis}
\end{tikzpicture}