\begin{figure*}[!htb]
  \centering
  % Two-panel schematic drawn with TikZ and shrunk to half size.
  % The % after the opening brace keeps the line end from becoming a
  % spurious space inside the scaled box (which would offset \centering).
  \scalebox{.5}{%
    \begin{tikzpicture}
      % ---------------- Panel (a): 6x6 grid of coloured unit cells ----------------
      \draw (0,0) grid (6,6);

      % Blue cells, given as x/y of the lower-left corner, top row first.
      \foreach \cx/\cy in {0/5, 2/5, 2/4, 3/4, 0/3, 3/3, 2/2, 3/1, 0/0, 3/0, 5/0}
        {\fill[blue] (\cx,\cy) rectangle ++(1,1);}

      % Red cells, same convention.
      \foreach \cx/\cy in {1/5, 1/4, 4/2, 1/1, 1/0}
        {\fill[red] (\cx,\cy) rectangle ++(1,1);}

      % Axis captions: columns are labelled "features", rows "items".
      \node at (2.5,6.5) {\Huge features $\to$};
      \node[rotate=-90] at (-.5,4) {{\Huge items $\to$}};

      \node at (-1,7.5) {\Huge (a)};

      % NOTE(review): \hspace is not a TikZ path command. It is kept at the
      % same point in the drawing order as before because its effect on the
      % rendered layout has not been verified -- confirm, and if a shift of
      % panel (b) is intended, express it through the coordinates instead.
      \hspace{-1cm}

      % ---------------- Panel (b): sum of 3x3 grey-scale matrices ----------------
      \node at (9,7.5) {\Huge (b)};

      % Each matrix below is a 3x3 grid whose cells are listed as
      % <percent black>/<x>/<y>, with (x,y) the lower-left corner of the cell.
      % Cells that are not listed stay unfilled.

      % Left-hand side of the "=" sign.
      \draw (10,2) grid (13,5);
      \node at (15,3.5) {\scalebox{5}{$=$}};
      %\node[] at (12,5.5) {\LARGE classifier $m$'s prediction of item $1$};
      \node at (11.5,6.2) {\LARGE classifier $m$'s labeling};
      \node at (11.6,5.5) {\LARGE probabilities of item $1$};
      \foreach \pct/\cx/\cy in {70/10/4, 5/11/4, 25/12/4,
                                20/10/3, 60/11/3, 20/12/3,
                                5/10/2, 15/11/2, 80/12/2}
        {\fill[black!\pct] (\cx,\cy) rectangle ++(1,1);}

      % First summand: baseline factors.
      \draw (17,2) grid (20,5);
      \node at (18.5,6.2) {\LARGE classifier $m$'s baseline};
      \node at (18.4,5.5) {\LARGE confusion matrix factors};
      \foreach \pct/\cx/\cy in {50/17/4, 20/18/4, 25/19/4,
                                30/17/3, 60/18/3, 15/19/3,
                                15/17/2, 20/18/2, 55/19/2}
        {\fill[black!\pct] (\cx,\cy) rectangle ++(1,1);}

      % Second summand: "feature 1" (only diagonal cells are filled).
      \node at (21,3.5) {\scalebox{5}{$+$}};
      \draw (22,2) grid (25,5);
      \node at (23.5,5.5) {\LARGE feature 1};
      \foreach \pct/\cx/\cy in {15/22/4, 10/23/3, 20/24/2}
        {\fill[black!\pct] (\cx,\cy) rectangle ++(1,1);}

      % Third summand: "feature 2" (only off-diagonal cells are filled).
      \node at (26,3.5) {\scalebox{5}{$+$}};
      \draw (27,2) grid (30,5);
      \node at (28.5,5.5) {\LARGE feature 2};
      \foreach \pct/\cx/\cy in {5/28/4, 15/29/4,
                                15/27/3, 5/29/3,
                                2/27/2, 10/28/2}
        {\fill[black!\pct] (\cx,\cy) rectangle ++(1,1);}

      % Fourth summand: "feature 3" (only diagonal cells are filled).
      \node at (31,3.5) {\scalebox{5}{$+$}};
      \draw (32,2) grid (35,5);
      \node at (33.5,5.5) {\LARGE feature 3};
      \foreach \pct/\cx/\cy in {5/32/4, 10/33/3, 20/34/2}
        {\fill[black!\pct] (\cx,\cy) rectangle ++(1,1);}
    \end{tikzpicture}}
\caption{Illustration of our proposed method, item-dependent BCC (idBCC). (a) The presence of shared latent features that can either increase classification accuracy (blue) or decrease classification accuracy (red) is inferred for every item. (b) The confusion matrix of each classifier conditioned on the item is the softmaxed sum of the baseline factors unique to classifier $m$ that determine its classification probabilities in the absence of any latent features (its confusion matrix is just the softmax of those factors over each row) and the (classifier-specific) inferred effects of each latent feature belonging to the item. Conditioning on the label of the item selects a row of the confusion matrix representing the classifier's labeling probabilities (features can be shared across items of potentially different ground-truth labels).}\label{fig:cartoon}
\end{figure*}