\begin{table}[t]
    \centering
    \caption{Summary of evaluation results}
    \begin{tabular}{ccccccc}
        \toprule
        \textbf{Task} &\textbf{Subtask} & \textbf{Metrics} & \textbf{Ours} & \textbf{ANFC}~\cite{zhao2024comprehensive} & \textbf{CAPI}~\cite{gracia2022challenge} & \textbf{Mask-RCNN}~\cite{he2017mask}\\
        \midrule
        Segm. & Capillary Mask & Sens.$\uparrow$  & \textbf{0.827} & 0.653 & ---  & 0.820\\
        KP. & Venous Diameter & MAE$\downarrow$ & 1.813 & \textbf{0.989} & 1.274 & 1.794\\
        KP. & Arterial Diameter& MAE$\downarrow$ & \textbf{0.825} & 0.849 & 0.856 & 1.351\\
        KP. & Apical Diameter& MAE$\downarrow$ &\textbf{0.321} & 1.674  & 0.575 & 1.047 \\
        Class. & Abnormal State &  Accuracy$\uparrow$ & \textbf{0.885} & 0.800  & 0.747 & 0.839\\
        \bottomrule
    \end{tabular}
    \begin{tablenotes}
        \item[1] The test set includes 61 images from distinct subjects, with no overlap between the subjects in the training and test datasets. The classification metric is computed at the image level, and the keypoint metrics are computed at the pixel level. For ANFC~\cite{zhao2024comprehensive}, we report the original results from the paper. For CAPI~\cite{gracia2022challenge} and Mask-RCNN~\cite{he2017mask}, we implemented the methods as described in the original papers and evaluated them on the dataset used in this work.
    \end{tablenotes}
    \label{tab:model_metrics}
\end{table}
