\section{List of selected datasets}\label{appendix:datasets}
\input{table_datasets}

\newpage
\section{Figures with original set of datasets}\label{appendix:complete_figures}
The following figures are the same as \figureref{fig:cumul_counts,fig:stackbar_presence_type}, but without removing the datasets that we considered to have too few matches. The absence of a dataset from one of the figures means that no paper contained a match for this dataset.
\begin{figure}[htbp]
\floatconts
    {fig:cumul_counts_all}
    {\caption{Cumulative counts per year of dataset citations (solid line) and mentions (dashed line) for classification datasets (a) and segmentation datasets (b).}}
    {
        \subfigure{
            \label{fig:cumul_mention_per_dataset_year_all}% label for this sub-figure
            \includegraphics[width=0.45\textwidth]{images/classification_citations_mentions_all.png}
        }
        \subfigure{
            \label{fig:cumul_citations_per_dataset_year_all}
            \includegraphics[width=0.45\textwidth]{images/segmentation_citations_mentions_all.png}
        }
    }
\end{figure}

\begin{figure}[htbp]
\floatconts
  {fig:stackbar_presence_type_all}
  {\caption{Type of presence per dataset and venue. The number in square brackets indicates the total number of papers for this subset.}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/stackbar_presence_type_all.png}}
\end{figure}


\section{Examples of dataset presence}\label{appendix:dataset_presence}
\subsection{Citations}
\begin{figure}[htbp]
\floatconts
  {fig:citation1}
  {\caption{Citation of a dataset without a mention (Wang et al., 2017, ChestX-Ray8) in the background section, as a demonstration of previous use.}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/citation_background.png}}
\end{figure}

\begin{figure}[htbp]
\floatconts
  {fig:citation2}
  {\caption{Citation that links to the dataset and not to the paper indicated in the BRATS guidelines.}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/link_citations.png}}
\end{figure}

\subsection{Mentions}
\textbf{In text:}

\begin{figure}[H]
\floatconts
  {fig:mention1}
  {\caption{Mention and citation of the BRATS papers, following the guidelines from the challenge.}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/citation_mention_brats.png}}
\end{figure}

\begin{figure}[H]
\floatconts
  {fig:mention2}
  {\caption{Mention of BRATS without a proper citation, with only a footnote linking to the data.}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/mention_no_citation.png}}
\end{figure}

\noindent \textbf{In figures and tables:}
\begin{figure}[H]
\floatconts
  {fig:mention3}
  {\caption{ACDC mentioned in a figure's caption}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/ACDC_Figure.png}}
\end{figure}

\begin{figure}[H]
\floatconts
  {fig:mention4}
  {\caption{BRATS mentioned in a table's caption}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/BRATS_table.png}}
\end{figure}


\noindent \textbf{In footnotes:}
\begin{figure}[H]
\floatconts
  {fig:mention5}
  {\caption{ACDC dataset's name mentioned in a footnote}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/ACDC_footnote.png}}
\end{figure}

\begin{figure}[H]
\floatconts
  {fig:mention6}
  {\caption{CAMELYON dataset mentioned in a footnote with the URL}}
  {\includegraphics[width=0.55\columnwidth,keepaspectratio]{images/camelyon_footnote_url.png}}
\end{figure}

\section{Examples of data from OpenAlex}\label{appendix:OA_exemples}
\begin{figure}[H]
\floatconts
    {fig:oa_abs}
    {\caption{Example of an abstract obtained from OpenAlex.}}
    {\includegraphics[width=0.5\textwidth]{images/OA_abstract.png}}
\end{figure}
\begin{figure}[H]
\floatconts
    {fig:oa_link}
    {\caption{Example of a link to the full-text PDF obtained from OpenAlex.}}
    {\includegraphics[width=\textwidth]{images/OA_link.png}}
\end{figure}
\begin{figure}[H]
\floatconts
    {fig:oa_refs}
    {\caption{Example of the list of citations in a paper, obtained from OpenAlex.}}
    {\includegraphics[width=\textwidth]{images/OA_refs.png}}
\end{figure}

\newpage
\section{Examples of data from GROBID}\label{appendix:GROBID_exemples}
\begin{figure}[H]
\floatconts
    {fig:grobid_abs}
    {\caption{Example of a header with abstract obtained after GROBID conversion to XML}} 
    {\includegraphics[width=\textwidth]{images/GROBID_header.png}}
\end{figure}
\begin{figure}[H]
\floatconts
    {fig:grobid_content}
    {\caption{Example of a full-text body obtained after GROBID conversion to XML.}}
    {\includegraphics[width=\textwidth]{images/GROBID_content.png}}
\end{figure}
\begin{figure}[H]
\floatconts
    {fig:grobid_refs}
    {\caption{Example of a citation obtained after GROBID conversion to XML}} 
    {\includegraphics[width=\textwidth]{images/GROBID_refs.png}}
\end{figure}