\begin{table}[h]
    \begin{minipage}{1\textwidth}
        % Unimodal encoder results on LOC.
        % Columns 2-5 hold the metrics on X_test^*, columns 6-9 the same metrics on X_test.
        % Every cell is written as mean(std) with no space before the parenthesis.
        \centering
        % The trailing % signs keep end-of-line spaces out of the box that gets scaled.
        \resizebox{\linewidth}{!}{%
            \small
            \begin{tabular}{
                @{ }l@{  }  l@{ }l@{ }l@{ }l@{ } l@{ }l@{ }l@{ }l@{ }
            }
            \toprule
            & \multicolumn{8}{c}{\cellcolor{lblue}\texttt{LOC}} \\
            & \multicolumn{4}{c}{$X_{\text{test}}^{*}$} & \multicolumn{4}{c}{$X_{\text{test}}$} \\
            % Partial rules mark which metric columns belong to which test set.
            \cmidrule(lr){2-5} \cmidrule(lr){6-9}
            & \textbf{ACC} & \textbf{F1} & \textbf{TNR} & \textbf{TPR}
            & \textbf{ACC} & \textbf{F1} & \textbf{TNR} & \textbf{TPR} \\
            \midrule
            % NOTE(review): F1 is far above TPR in several rows (e.g. Audio: 96.0 vs 19.7);
            % confirm which class / averaging the F1 column refers to.
            % Video has no X_test entries; missing values are shown as en-dashes.
            Video
            & 87.1(1.2) & 98.0(0.2) & 98.0(0.4) & 75.6(2.5)
            & -- & -- & -- & -- \\
            \midrule
            % Audio: first four values are "audio complete", last four are "audio all".
            % NOTE(review): the TNR std "(4)" is the only std without a decimal; confirm 4.0 vs 0.4.
            Audio
            & 57.6(1.5) & 96.0(0.2) & 95.5(4) & 19.7(2.9)
            & 55.6(1.8) & 83.2(3.2) & 71.6(5.1) & 39.6(6.3) \\
            Visual Field
            & 66.2(3.4) & 92.8(2.5) & 89.5(4.4) & 43.0(9.4)
            & 72.9(4.0) & 92.1(3.0) & 85.8(5.2) & 60.1(7.2) \\
            Pedals
            & 69.2(2.5) & 96.6(0.2) & 95.8(0.5) & 42.6(5.4)
            & 68.5(1.5) & 89.5(0.3) & 81.2(1.0) & 55.7(3.4) \\
            Electrocardiograms
            & 60.3(3.4) & 96.1(0.8) & 95.0(1.5) & 25.5(6.8)
            & 55.9(3.0) & 93.9(1.7) & 88.9(3.0) & 23.0(7.8) \\
            Electromyograms
            & 58.5(12.9) & 26.8(11.7) & 22.8(10.2) & 94.2(9.5)
            & 54.9(4.2) & 27.5(10.8) & 21.6(30.6) & 88.1(22.5) \\
            \bottomrule
            \end{tabular}%
        }
        % Caption font is set locally; the minipage keeps the setting from leaking out.
        \captionsetup{font=footnotesize}
        \caption{\textbf{Performance of unimodal encoders for \texttt{LOC}.} Audio, visual field (VF), pedals (PAL), electrocardiogram (ECG) and electromyogram (EMG) performances are evaluated after the \textit{anchoring} (i.e., after the alignment to the anchor, the video). We report the results on $X_{\text{test}}$ and $X_{\text{test}}^{*}$ in the form mean(std).}
        \label{tab:unimodal-loc}
    \end{minipage}
        \hfill
        \begin{minipage}{\textwidth}
            % Unimodal encoder results on StressID.
            % Columns 2-3 hold ACC/F1 on X_test^*, columns 4-5 hold ACC/F1 on X_test.
            % Every cell is written as mean(std) with no space before the parenthesis.
            \centering
            % The trailing % signs keep end-of-line spaces out of the box that gets scaled.
            \resizebox{0.5\linewidth}{!}{%
                \small
                \begin{tabular}{
                    @{ }l@{  }  l@{ }l@{ } l@{ }l@{ }
                }
                \toprule
                & \multicolumn{4}{c}{\cellcolor{lblue}\texttt{StressID}} \\
                & \multicolumn{2}{c}{$X_{\text{test}}^{*}$} & \multicolumn{2}{c}{$X_{\text{test}}$} \\
                % Partial rules mark which metric columns belong to which test set.
                \cmidrule(lr){2-3} \cmidrule(lr){4-5}
                & \textbf{ACC} & \textbf{F1}
                & \textbf{ACC} & \textbf{F1} \\
                \midrule
                % NOTE(review): the F1 std "(4)" is the only std without a decimal; confirm 4.0 vs 0.4.
                EDA
                & 58.0(2.8) & 65.4(4) & 64.0(2.2) & 64.1(2.1) \\
                RR
                & 57.1(4.1) & 58.0(4.8) & 58.4(3.0) & 58.0(3.4) \\
                ECG
                & 55.6(3.6) & 39.8(7.3) & 55.5(2.2) & 48.7(4.0) \\
                % Audio has no X_test entries; missing values are shown as en-dashes.
                Audio
                & 59.9(6.2) & 66.9(9.1) & -- & -- \\
                \bottomrule
                \end{tabular}%
            }
            % Caption font is set locally; the minipage keeps the setting from leaking out.
            \captionsetup{font=footnotesize}
            \caption{\textbf{Performance of unimodal encoders for \texttt{StressID}.} Audio, EDA, ECG and RR performances are evaluated after the \textit{anchoring} (i.e., after the alignment to the anchor, the video). We report the results on $X_{\text{test}}$ and $X_{\text{test}}^{*}$ in the form mean(std).}
            \label{tab:unimodal-stress}
        \end{minipage}
        \hfill
       \begin{minipage}{\textwidth}
           % ADAPT on LOC under three missing-modality scenarios.
           % Layout: label column, then three (metric, delta, empty spacer) column triples.
           % The deltas equal baseline minus scenario, e.g. ACC 67.4 - 61.9 = 5.5 for "real-life".
           \centering
           % The trailing % signs keep end-of-line spaces out of the box that gets scaled.
           \resizebox{0.60\linewidth}{!}{%
               \small
               \begin{tabular}{
                   l@{  }  r@{ }r@{ }r@{ } r@{ }r@{ }r@{ } r@{ }r@{ }r@{ }
               }
               \toprule
               & \multicolumn{9}{c}{\cellcolor{lblue}\textbf{\texttt{LOC}}} \\
               & \textbf{ACC} & $+\Delta$ & & \textbf{TNR} & $+\Delta$ & & \textbf{TPR} & $+\Delta$ & \\
               \midrule
               % Baseline row: the reference the deltas are computed against.
               % NOTE(review): this row has no label in the first column; consider naming it.
               & 67.4(1.3) & & & 65.3(1.6) & & & 69.5(1.5) &
               % stress - 2 classes
               % & 69.5(3.7) & & & 50.2(8) & & & 88.7(5.6) & &
               \\
               % Negative deltas are set in math mode so they print a minus sign, not a hyphen.
               \textit{real-life}
               & 61.9(7.2) & 5.5 & & 70.1(2.1) & $-4.8$ & & 61.4(10.4) & 8.1 &
               % % stress - 2 classes
               % & 60.0(4.8) & 9.5 & & 66.9(9.5) & -5.0 & & 53.1(7.9) & 24 &
               \\
               % NOTE(review): "no video" and "no audio" differ only in the TPR std (6.5 vs 6.4);
               % confirm that one row is not a copy of the other.
               \textit{no video}
               % loc - 2 classes
               & 64.9(8.3) & 2.5 & & 63.0(15.2) & 2.3 & & 66.8(6.5) & 2.7 &
               \\
               % % stress - 2 classes
               % & 61.2(4.6) & 8.3 & & 53.7(10.1) & 8.5 & & 68.8(7.1) & 8.3 &
               % \\
               \textit{no audio}
               % % loc 2 classes
               & 64.9(8.3) & 2.5 & & 63.0(15.2) & 2.3 & & 66.8(6.4) & 2.7 &
               \\
               % % stress - 2 classes
               % & 68.3(2.9) & 1.2 & & 65.8(6.8) & -4.0 & & 70.7(7.4) &6.4 &
               % \\
               \bottomrule
               \end{tabular}%
           }
           % Caption font is set locally; the minipage keeps the setting from leaking out.
           \captionsetup{font=footnotesize}
           \caption{\textbf{Evaluation of ADAPT on three modality scenarios on $X_{\text{test}}^{*}$ for \texttt{LOC}.} For each scenario, we remove
           one or two modalities from the test samples. We report mean and standard deviation for ACC, TNR, and
           TPR, and calculate the differences ($\Delta$) with respect to the test with no modality removed.}
           \label{tab:scenarios_inter}
       \end{minipage}
\end{table}