%% The first command in your LaTeX source must be the \documentclass command.
%%
%% Options:
%% twocolumn : Two column layout. Do not use twocolumn for papers submitted to CEUR-WS!
%% hf: enable header and footer.
\documentclass[
% twocolumn,
% hf,
]{ceurart}

%%
%% One can fix some overfulls
\sloppy

%%
%% Code listings support (listings package).
%% Unlike minted, listings needs neither Pygments nor shell escape.
\usepackage{listings}
%% auto break lines
\lstset{breaklines=true}


% Custom package import
%%
\usepackage{afterpage}

\usepackage{tikz}
\usepackage{pgfplots}
\pgfplotsset{width=\linewidth}

\usepackage{tcolorbox}
\usepackage{xcolor}
\usepackage{lipsum}
\usepackage{makecell}
\usepackage{enumitem}
\setlist[itemize]{itemsep=0pt,parsep=0pt}

% Inline highlighting helpers: \red{<text>} and \orange{<text>} typeset
% <text> in the named colour. The inner brace group keeps the \color
% switch local to the argument.
\newcommand{\red}[1]{{\color{red}#1}}
\newcommand{\orange}[1]{{\color{orange}#1}}

% \usepackage{soul}

% Framed text box: white background, black frame, bold title.
%   #1 (optional, default empty): value forwarded to tcolorbox's `label` key
%   #2 (mandatory): value forwarded to tcolorbox's `title` key
% Both values are wrapped in braces so that a title or label containing a
% comma or an equals sign reaches its key as one value instead of being
% split into separate (unknown) options by the key-value parser.
\newtcolorbox{styledtext}[2][]{%
  colback=white,
  colframe=black,
  fonttitle=\bfseries,
  title={#2},
  label={#1},
}
% Variant of the framed text box whose upper part is set with
% `fontupper=\sffamily`; frame, background and title styling are otherwise
% the same key values.
%   #1 (optional, default empty): value forwarded to tcolorbox's `label` key
%   #2 (mandatory): value forwarded to tcolorbox's `title` key
% Both values are wrapped in braces so that a title or label containing a
% comma or an equals sign reaches its key as one value instead of being
% split into separate (unknown) options by the key-value parser.
% NOTE(review): the environment name ends in `tt`, but the font selected is
% sans-serif (\sffamily), not typewriter -- confirm this is intended.
\newtcolorbox{styledtexttt}[2][]{%
  colback=white,
  colframe=black,
  fonttitle=\bfseries,
  fontupper=\sffamily,
  title={#2},
  label={#1},
}

% \sans{<text>}: typeset <text> in the font family `SourceSansPro-TLF`
% (Source Sans Pro). The inner brace group confines the family switch to
% the argument, so the surrounding font is untouched.
% NOTE(review): no font package is loaded for this family in this file;
% presumably its font definition files come from the TeX distribution --
% confirm.
\newcommand{\sans}[1]{%
  {\fontfamily{SourceSansPro-TLF}\selectfont #1}%
}
% \newcommand{\sans}[1]{{\fontfamily{LibertinusSans-TLF}\selectfont #1}}


% for heatmap tables
\usepackage{colortbl}
\usepackage{array}

% Seven-step colour ramp from white to dark green for heatmap tables.
% The range noted on each line is the integer value band for which
% \heatcell / \heatcellcolor select that colour.
\definecolor{green0}{RGB}{255,255,255}   % white              (value < 10)
\definecolor{green1}{RGB}{240,248,240}   % very light green   (10..19)
\definecolor{green2}{RGB}{220,240,220}   % light green        (20..29)
\definecolor{green3}{RGB}{180,220,180}   % medium light green (30..49)
\definecolor{green4}{RGB}{140,200,140}   % medium green       (50..69)
\definecolor{green5}{RGB}{100,180,100}   % darker green       (70..84)
\definecolor{green6}{RGB}{60,160,60}     % dark green         (value >= 85)

% Heatmap cell helpers. Both take one argument: an integer (no decimal
% part, because it is compared with \ifnum).
%
%   value < 10   -> green0        50..69       -> green4
%   10..19       -> green1        70..84       -> green5
%   20..29       -> green2        value >= 85  -> green6
%   30..49       -> green3
%
% \heatcellcolor{<n>}  sets the cell background only.
% \heatcell{<n>}       sets the cell background and prints <n>.
%
% The bands are written once, as a single \ifnum/\else ladder, and
% \heatcell delegates to \heatcellcolor so the two macros cannot drift
% apart. Every numeric constant is terminated with \relax so that no
% following conditional is expanded while TeX is still reading the number.
\newcommand{\heatcellcolor}[1]{%
  \ifnum#1<10\relax\cellcolor{green0}%
  \else\ifnum#1<20\relax\cellcolor{green1}%
  \else\ifnum#1<30\relax\cellcolor{green2}%
  \else\ifnum#1<50\relax\cellcolor{green3}%
  \else\ifnum#1<70\relax\cellcolor{green4}%
  \else\ifnum#1<85\relax\cellcolor{green5}%
  \else\cellcolor{green6}%
  \fi\fi\fi\fi\fi\fi%
}
\newcommand{\heatcell}[1]{\heatcellcolor{#1}#1}

% xspace provides \xspace, which \pro relies on; load it before the macro
% that uses it.
\usepackage{xspace}
% \pro: the benchmark name in small caps. The trailing \xspace lets the
% macro be written as "\pro addresses ..." without an explicit "\ " or "{}".
\newcommand{\pro}{\textsc{ProverbIT}\xspace}


% URL line breaking: load breakurl and set \UrlBreaks to just "/" and "-".
% NOTE(review): \def replaces any previously defined \UrlBreaks list rather
% than extending it, so break points that list allowed before (presumably
% the url package defaults) are dropped -- confirm this is intended.
\usepackage{breakurl}
\def\UrlBreaks{\do\/\do-}


% Two named colours (light blue, light orange); presumably the swatch
% colours passed to \legendsquare -- TODO confirm against the sections.
\definecolor{tableblue}{rgb}{0.678, 0.847, 0.902}
\definecolor{tableorange}{rgb}{1.0, 0.7, 0.5}
% \legendsquare{<color>}: a filled rule 3ex wide and 1.5ex high drawn in
% <color>. Declared with \DeclareRobustCommand, so it is a robust command.
\DeclareRobustCommand{\legendsquare}[1]{\textcolor{#1}{\rule{3ex}{1.5ex}}}




%%
%% end of the preamble, start of the body of the document source.
\begin{document}

%%
%% Rights management information.
%% CC-BY is default license.
\copyrightyear{2026}
\copyrightclause{Copyright for this paper by its authors.
  Use permitted under Creative Commons License Attribution 4.0
  International (CC BY 4.0).}

%%
%% This command is for the conference information
\conference{EVALITA 2026: 9th Evaluation Campaign of Natural Language
Processing and Speech Tools for Italian, Feb 26--27, Bari, IT}

%%
%% The "title" command
\title{ProverbIT -- Easy to complete, hard to choose:
A CALAMITA Challenge}

% \tnotemark[1]
% \tnotetext[1]{You can use this document as the template for preparing your
  % publication. We recommend using the latest version of the ceurart style.}

% %%
% %% The "author" command and its associated commands are used to define
% %% the authors and their affiliations.
% \author[1,2]{Dmitry S. Kulyabov}[%
% orcid=0000-0002-0877-7063,
% email=kulyabov-ds@rudn.ru,
% url=https://yamadharma.github.io/,
% ]
% \cormark[1]
% \fnmark[1]
% \address[1]{Peoples' Friendship University of Russia (RUDN University),
%   6 Miklukho-Maklaya St, Moscow, 117198, Russian Federation}
% \address[2]{Joint Institute for Nuclear Research,
%   6 Joliot-Curie, Dubna, Moscow region, 141980, Russian Federation}

% \author[3]{Ilaria Tiddi}[%
% orcid=0000-0001-7116-9338,
% email=i.tiddi@vu.nl,
% url=https://kmitd.github.io/ilaria/,
% ]
% \fnmark[1]
% \address[3]{Vrije Universiteit Amsterdam, De Boelelaan 1105, 1081 HV Amsterdam, The Netherlands}

% \author[4]{Manfred Jeusfeld}[%
% orcid=0000-0002-9421-8566,
% email=Manfred.Jeusfeld@acm.org,
% url=http://conceptbase.sourceforge.net/mjf/,
% ]
% \fnmark[1]
% \address[4]{University of Skövde, Högskolevägen 1, 541 28 Skövde, Sweden}

% %% Footnotes
% \cortext[1]{Corresponding author.}
% \fntext[1]{These authors contributed equally.}


%%
%% The "author" command and its associated commands are used to define
%% the authors and their affiliations.
\author[1]{Enrico Mensa}[%
% orcid=,
email=enrico.mensa@unito.it,
% url=,
]
\cormark[1]
\fnmark[1]
\author[2]{Lorenzo Zane}[%
% orcid=,
email=lorenzozane98@gmail.com,
% url=,
]
\fnmark[1]
\author[1]{Calogero J. Scozzaro}[%
% orcid=,
email=calogerojerik.scozzaro@unito.it,
% url=,
]
\author[1]{Matteo {Delsanto}}[%
% orcid=,
email=matteo.delsanto@unito.it,
% url=,
]
\author[2]{Tommaso Milani}[%
% orcid=,
email=milani.tommaso2004@gmail.com,
% url=,
]
\author[1]{Daniele P. Radicioni}[%
% orcid=,
email=daniele.radicioni@unito.it,
% url=,
]

\address[1]{Department of Computer Science, University of Turin, Turin, Italy}
\address[2]{Independent Researcher}

%% Footnotes
\cortext[1]{Corresponding author.}
\fntext[1]{These authors contributed equally.}




%%
%% The abstract is a short summary of the work to be presented in the
%% article.
\begin{abstract}
We present \pro, a benchmark designed to evaluate the reasoning capabilities of Large Language Models (LLMs) beyond simple pattern matching. While current models demonstrate high proficiency in text generation, their ability to discriminate between plausible but incorrect options remains understudied. \pro addresses this gap through a challenging multiple-choice task focused on Italian proverbs. In this setting, models are provided with the beginning of a proverb and must select the correct completion from five options.  Crucially, four options are always incorrect distractors, making the fifth option, `None of the others', the only valid answer. This adversarial design forces models to abandon surface-level heuristics and engage in deeper semantic reasoning to actively discard misleading alternatives. To distinguish between a lack of knowledge and a failure in discriminative reasoning, we also introduce a generative completion baseline, where models simply complete the proverb from its initial fragment. The dataset comprises 100 common Italian proverbs, curated and validated by native speakers. 
\end{abstract}

%%
%% Keywords. The author(s) should pick words that accurately describe
%% the work being presented. Separate the keywords with commas.
\begin{keywords}
Large Language Models \sep
Reasoning \sep 
Multiple-choice questions \sep
Italian Proverbs
\end{keywords}

%%
%% This command processes the author and affiliation and title
%% information and builds the first part of the formatted document.

\maketitle

\input{sections/01_introduction}

\input{sections/02_challenge}

\input{sections/03_dataset}

\input{sections/04_metrics}

\input{sections/05_results}

\input{sections/06_limitations}

\input{sections/07_ethics}

\input{sections/08_copyright}










% \section{Acknowledgments}

% Identification of funding sources and other support, and thanks to
% individuals and groups that assisted in the research and the
% preparation of the work should be included in an acknowledgment
% section, which is placed just before the reference section in your
% document.

% This section has a special environment:
% \begin{lstlisting}
% \begin{acknowledgments}
%   These are different acknowledgments.
% \end{acknowledgments}
% \end{lstlisting}
% so that the information contained therein can be more easily collected
% during the article metadata extraction phase, and to ensure
% consistency in the spelling of the section heading.

% Authors should not prepare this section as a numbered or unnumbered
% \verb|\section|; please use the ``\verb|acknowledgments|'' environment.

% \section{Appendices}

% If your work needs an appendix, add it before the
% ``\verb|\end{document}|'' command at the conclusion of your source
% document.

% Start the appendix with the ``\verb|\appendix|'' command:
% \begin{lstlisting}
% \appendix
% \end{lstlisting}
% and note that in the appendix, sections are lettered, not
% numbered. 

%%
%% The acknowledgments section is defined using the "acknowledgments" environment
%% (and NOT an unnumbered section). This ensures the proper
%% identification of the section in the article metadata, and the
%% consistent spelling of the heading.
%\begin{acknowledgments}
  % Thanks to the developers of ACM consolidated LaTeX styles
  % \url{https://github.com/borisveytsman/acmart} and to the developers
  % of Elsevier updated \LaTeX{} templates
  % \url{https://www.ctan.org/tex-archive/macros/latex/contrib/els-cas-templates}.  
%\end{acknowledgments}

%% The declaration on generative AI comes into effect
%% in January 2025. See also
%% https://ceur-ws.org/GenAI/Policy.html
\section*{Declaration on Generative AI}
  % {\em Either:}\newline
  % The author(s) have not employed any Generative AI tools.
  % \newline
  
 % \noindent{\em Or (by using the activity taxonomy in ceur-ws.org/genai-tax.html):\newline}
 % During the preparation of this work, the author(s) used X-GPT-4 and Gramby in order to: Grammar and spelling check. Further, the author(s) used X-AI-IMG for figures 3 and 4 in order to: Generate images. After using these tool(s)/service(s), the author(s) reviewed and edited the content as needed and take(s) full responsibility for the publication’s content. 

 During the preparation of this work, the authors used gemini-3-pro-preview in order to: Grammar and spelling check. After using this tool, the authors reviewed and edited the content as needed and take full responsibility for the publication's content.

%%
%% Define the bibliography file to be used
\bibliography{ceur}

%%
%% If your work has an appendix, this is the place to put it.
\appendix

% \section{Online Resources}


% The sources for the ceur-art style are available via
% \begin{itemize}
% \item \href{https://github.com/yamadharma/ceurart}{GitHub},
% % \item \href{https://www.overleaf.com/project/5e76702c4acae70001d3bc87}{Overleaf},
% \item
%   \href{https://www.overleaf.com/latex/templates/template-for-submissions-to-ceur-workshop-proceedings-ceur-ws-dot-org/pkfscdkgkhcq}{Overleaf
%     template}.
% \end{itemize}

\end{document}

%%
%% End of file
