\documentclass{midl} % Include author names

% The following packages will be automatically loaded:
% jmlr, amsmath, amssymb, natbib, graphicx, url, algorithm2e
% ifoddpage, relsize and probably more
% make sure they are installed with your latex distribution
\usepackage{threeparttable}
\usepackage{multirow}
\usepackage{booktabs}
\definecolor{newcolor}{rgb}{.8,.349,.1}


% \usepackage{mwe} % to get dummy images
\jmlrvolume{-- 181}
\jmlryear{2026}
\jmlrworkshop{Full Paper -- MIDL 2026}
\editors{Accepted for publication at MIDL 2026}

\title[What Fine-Tuning Changes]{What Fine-Tuning Changes: A Radiomic Lens on Prostate Foundation Model Representations}

 % Use \Name{Author Name} to specify the name.
 % If the surname contains spaces, enclose the surname
 % in braces, e.g. \Name{John {Smith Jones}} similarly
 % if the name has a "von" part, e.g \Name{Jane {de Winter}}.
 % If the first letter in the forenames is a diacritic
 % enclose the diacritic in braces, e.g. \Name{{\'E}louise Smith}

 % Two authors with the same address
 % \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\and
 %  \Name{Author Name2} \Email{xyz@sample.edu}\\
 %  \addr Address}

 % Three or more authors with the same address:
 % \midlauthor{\Name{Author Name1} \Email{an1@sample.edu}\\
 %  \Name{Author Name2} \Email{an2@sample.edu}\\
 %  \Name{Author Name3} \Email{an3@sample.edu}\\
 %  \addr Address}


% Authors with different addresses:
% \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\\
% \addr Address 1
% \AND
% \Name{Author Name2} \Email{xyz@sample.edu}\\
% \addr Address 2
% }

%\footnotetext[1]{Contributed equally}

% More complicate cases, e.g. with dual affiliations and joint authorship
\midlauthor{\Name{Yipei Wang\nametag{$^{1}$}} \orcid{0000-0002-9589-7177} \Email{yipei.wang@ucl.ac.uk}\\
\addr $^{1}$ UCL Hawkes Institute, Department of Medical Physics and Biomedical Engineering, University College London \\
\AND
\Name{Yaxi Chen\nametag{$^{1}$}} \orcid{0009-0007-5906-899X}\Email{yaxi.chen.20@ucl.ac.uk}\\
\Name{Wen Yan\nametag{$^{1}$}} \orcid{0000-0002-3962-5994} \Email{wen-yan@ucl.ac.uk}\\
\Name{Natasha Thorley\nametag{$^{2,3}$}} \orcid{0000-0001-8928-895X}\Email{natasha.thorley@ucl.ac.uk}\\
\addr $^{2}$ Centre for Medical Imaging, University College London\\
\addr $^{3}$ Department of Radiology, University College London Hospital NHS Foundation Trust\\
\AND
\Name{Alexander Ng\nametag{$^{4}$}} \orcid{0000-0001-5441-2017}\Email{alexander.ng@ucl.ac.uk}\\
\addr $^{4}$ Centre for Urology Imaging, Prostate, AI and Surgical Studies (COMPASS) Research Group, Division of Surgery and Interventional Science, University College London \AND
\Name{Dean C. Barratt\nametag{$^{1}$}} \orcid{0000-0003-2916-655X} \Email{d.barratt@ucl.ac.uk}\\
\AND
\Name{Daniel C. Alexander\nametag{$^{1,5}$}} \orcid{0000-0003-2439-350X}\Email{d.alexander@ucl.ac.uk}\\
\addr $^{5}$ Department of Computer Science, University College London\AND
\Name{Shonit Punwani\nametag{$^{2,3}$}} \orcid{0000-0002-1014-0870}\Email{s.punwani@ucl.ac.uk}\\
 \AND
\Name{Mark Emberton\nametag{$^{6,7}$}} \orcid{0000-0003-4230-0338}\Email{m.emberton@ucl.ac.uk}\\
\addr $^{6}$ Department of Urology, University College London Hospital\\
\addr $^{7}$ Division of Surgery and Interventional Science, University College London\\
\AND
\Name{Veeru Kasivisvanathan\nametag{$^{4,6}$}} \orcid{0000-0002-0832-382X}\Email{veeru.kasi@ucl.ac.uk}\\
\AND
\Name{Yipeng Hu\nametag{$^{1}$}} \orcid{0000-0003-4902-0486}\Email{yipeng.hu@ucl.ac.uk}\\
\AND
}

\begin{document}

\maketitle

\begin{abstract}
Clarifying how foundation model encoders change during fine-tuning is important for transparency and trustworthiness in their medical imaging applications. It may also be useful for further understanding, developing, and adapting these models. However, the latent representations produced by such encoders are high dimensional and lack explicit semantic meaning, making it difficult to characterise how task-specific adaptation modifies them. In this study, we introduce a radiomics-based framework that provides an interpretable lens through which these representational changes can be examined and often better understood. 
Using prostate cancer patient imaging data, we train a two-layer MLP to learn the relationship between radiomic descriptors and encoder embeddings prior to fine-tuning. This model captures non-linear associations through its first layer, while the final linear layer offers an interpretable mapping from radiomic attributes to (transformed) latent features. To quantify the effect of fine-tuning, the first layer is fixed, and only the linear layer is re-estimated using the embeddings from the fine-tuned encoder. Comparing the pre- and post-fine-tuning linear weights yields a direct quantitative measure of how the encoder’s emphasis on specific radiomic characteristics shifts during fine-tuning.
We validate the approach using a prostate MRI foundation model and multiple downstream tasks. The analysis reveals consistent, task-dependent changes in the encoder’s sensitivity to radiomic texture and intensity features. This work provides the first radiomics-based methodology for systematically interpreting how fine-tuning restructures foundation model representation in medical imaging. The implementation is available at: \url{https://github.com/pipiwang/RadiomicLens}.
\end{abstract}

\begin{keywords}
mpMRI, Foundation model, Radiomic feature, Interpretability
\end{keywords}

\section{Introduction}
Foundation models, which are pre-trained on large-scale datasets, often using a self-supervised learning paradigm, have increasingly been applied to medical tasks across various modalities and anatomical structures~\cite{wu2025towards, zhou2023foundation,fu2025cinema, zhang2024generalist, mcconnell2025computationally}. These recent advances have demonstrated the potential of foundation models to achieve better performance in individual applications when fine-tuned and adapted to specific downstream tasks.
However, current research has been largely motivated by and emphasising performance boosts over existing specialised supervised learning models, whereas the interpretability study on foundation models in medical applications is restricted to saliency maps \cite{zhou2023foundation} or effects on quantitative results of different fine-tuning strategies \cite{mcconnell2025computationally}.
%Whilst focusing on presenting performance boosts over specialised supervised learning models, current research provided limited interpretability study on foundation models in medical applications, such as saliency maps \cite{zhou2023foundation} or effects on quantitative results of different fine-tuning strategies \cite{mcconnell2025computationally}. 
The role of fine-tuning in affecting model behaviour and reshaping representation space in foundation models for medical tasks remains insufficiently studied.


Understanding how foundation model encoders change during fine-tuning is essential for interpreting their behaviour in medical image analysis. Although fine-tuning is known to adapt representations towards a target task, the nature of this adaptation is often opaque. Encoder features are high-dimensional and lack clear semantic meaning, which makes it difficult to understand what prior knowledge is retained, what is modified, and how these changes relate to clinically meaningful image characteristics. Despite the recent research efforts on interpreting deep learning models, existing methods face significant limitations. Concept attribution methods such as Testing with Concept Activation Vectors (TCAV) \cite{kim2018interpretability} require a manually defined set of images that positively represent a concept and another random set that does not, while sparse autoencoders \cite{cunningham2023sparse} produce latent dimensions that may correlate with internal representations, but the resulting factors are not guaranteed to be human-meaningful. The discovered concepts often need post-hoc interpretation, which would further add to the workload of clinical experts who must interpret ambiguous or uninterpretable latent features. 

Radiomics provides a complementary and interpretable representation of medical images, consisting of comprehensive descriptions such as texture, intensity statistics, and shape descriptors, for a given region of interest (ROI) \cite{zwanenburg2016image, aguirre2025radiomics}. These features provide quantitative characterisations of medical images which contribute to the radiologists' decision-making process on disease diagnosis and treatment planning \cite{tomaszewski2021biological}. Unlike the obscure, high-dimensional features from deep learning models, radiomic features have explicit definitions that allow fine-grained interpretation. In this work, we propose to use radiomic features as an interpretable reference space to analyse how a foundation model encoder changes before and after fine-tuning.

This work proposes to model the relationship between radiomic features and encoder embeddings using a two-layer MLP. The network is first trained on the pre-fine-tuning encoder features so that it can learn a general non-linear mapping while keeping the final linear layer directly interpretable. To analyse how fine-tuning alters the encoder representation, we freeze the first layer of the MLP and solve the interpretation linear head using the fine-tuned embeddings. Comparing the two linear heads then highlights how the influence of each radiomic attribute has changed, offering an interpretable view of the effects of fine-tuning.

% In this work, we focus on finding the changes from foundation model fine-tuning. Specifically, we map the high dimensional features from the encoder of foundation backbones to explainable radiomic features calculated from the original input images. We evaluate xx on xx datasets across xx different tasks. We show that xx. 
%In this study, we show that radiomics can be used as a practical explanation tool for real patient medical images, provide the first radiomics-based analysis that makes fine-tuning behaviour quantified, and demonstrate the approach on a prostate MRI foundation model across multiple downstream tasks. 
In this work, we introduce radiomics as an interpretable framework for explaining encoder representations on real patient medical imaging data. We provide the first radiomics-based analysis that makes encoder changes during fine-tuning quantitatively interpretable. The proposed approach is demonstrated using a prostate MRI foundation model across multiple downstream tasks, showing how radiomics reveal task-specific adaptation.

\section{Method}
We introduce a two-stage framework to investigate the relationship between the internal feature representation of the foundation model and radiomic features calculated directly from images, and capture the changes during task-specific fine-tuning, as shown in Fig.~\ref{fig:main}. At the first stage, features of the foundation model encoder from before and after fine-tuning are projected into a unified, non-linear space; while in the second stage, closed-form linear regression is applied to reconstruct radiomic features from the projected features. By analysing the difference of weights and residuals in the linear decoding between pre- and post- fine-tuning, we provide quantitative measures of representation shift during the fine-tuning process.

\begin{figure}[htbp]
 % Caption and label go in the first argument and the figure contents
 % go in the second argument
\floatconts
  {fig:main}
  {\caption{Overview of the proposed framework.}}
  {\includegraphics[width=0.8\linewidth]{radiomic.png}}
\end{figure}

\subsection{Problem formulation}
Let $E(\cdot)$ denote a pre-trained foundation model encoder and $E^{ft}(\cdot)$ one of its fine-tuned variants for a specific downstream task, both of which map the input patient data $x$ into a $d$-dimensional feature space. For each patient data $x$, $X^{pre} = E(x)$ and $X^{ft} = E^{ft}(x)$,
where $X^{pre} \in \mathbb{R}^d$ and $X^{ft} \in \mathbb{R}^d$ represent the features from the pre-trained and fine-tuned foundation model encoder respectively. 

For each patient data $x$, there may exist more than one data modality, for example, various image modality sequences for multi-parametric magnetic resonance imaging (mpMRI). Radiomic features are calculated for each image modality $m$ and the ROI pair, denoted as $R_m \in \mathbb{R}^{n}, m=1,2,\dots,M$, where $M$ denotes the total number of modalities of each patient. A set of radiomic features of the same types is calculated for each modality, resulting in $M$ $n$-dimensional vectors, $R={[R_1^\intercal, R_2^\intercal, \dots, R_M^\intercal]}^\intercal \in \mathbb{R}^{nM}$.

The goal is to establish a function
\begin{equation}
    f:\mathbb{R}^d \rightarrow \mathbb{R}^{nM},
\end{equation}
that projects the foundation model encoder features onto the corresponding radiomic features.

% The parameters of the two projection function is solved by:
% \begin{equation}
%     (\hat{\phi}, \hat{\theta}) = \arg \min_{\phi,\theta} 
% \end{equation}

\subsection{Shared non-linear projection}
\label{non-linear}
We first project encoder features into a shared hidden space by learning a shared non-linear function,
\begin{equation}
    Z = f^{share}(X;\phi)
\end{equation}
In order to learn this projection, we decompose $f$ into a shared non-linear projection and modality-specific linear heads, denoted as:
\begin{equation}
    f(X)=f^{head}(f^{share}(X;\phi),\theta).
\end{equation}
The model parameters are optimised using reconstruction loss with optional $L1$, $L2$, or elastic penalties on model weights:
\begin{equation}
    \mathcal{L} = \mathcal{L}_{rec} + \lambda_1||\phi,\theta||_1 + \lambda_2||\phi,\theta||_2^2.
\end{equation}
Therefore, 
\begin{equation}
    (\hat{\phi}, \hat{\theta}) = \arg \min_{\phi,\theta} \sum^M_{m=1}||f_m^{head}(f^{share}(X^{pre};\phi);\theta_m)-R_m||_1+\lambda_1||\phi,\theta||_1 + \lambda_2||\phi,\theta||_2^2.
\end{equation}
The first stage is optimised using features from before fine-tuning as input. Once trained, we freeze the weights of the shared function and discard the temporary heads $f^{head}_m$.
The latent features obtained from this stage are denoted as $Z^p = f^{share}(X^{pre};\hat{\phi})$ and $Z^{ft} = f^{share}(X^{ft};\hat{\phi})$.

\subsection{Closed-form linear radiomic decoding}
After transforming the features from foundation models to the shared hidden space, we solve a new linear decoder for hidden features from pre- and post- fine-tuning separately using least-squares, in a single matrix form: $R=\theta Z$. 
The optimal parameters are solved by: $ \hat{\theta}=RZ^\intercal(ZZ^\intercal)^{-1}$.

\section{Experiments}
\subsection{Dataset}
The proposed radiomic interpretation framework is evaluated on two datasets across three downstream tasks. The first dataset is a multi-study mpMRI collection from the UCL hospital, including SmartTarget \citep{hamid_smarttarget}, PICTURE \citep{simmons_picture}, ProRAFT \citep{orczyk_proraft}, Index \citep{dickinson_index}, PROMIS \citep{bosaily_promis} and PROGENY \citep{linch_progeny}. This dataset contains mpMRI from 850 patients, including T2-weighted image (T2), high-b value diffusion-weighted image (DWI), and Apparent Diffusion Coefficient (ADC) maps, with both lesion and prostate gland masks available on each T2 image. We refer to this dataset as the UCLH dataset in the following sections. The second dataset consists of prostate mpMRI with gland contour from $1,028$ patients recruited in the ReImagine Risk study \cite{marsden2021update}.

All images are resampled to a voxel size of $0.5 \times 0.5 \times 1\,\mathrm{mm}^3$. Each dataset is split into training, validation, and test sets with a ratio of 7:1:2 at the patient level, for downstream task fine-tuning and evaluation.
\subsection{Foundation model pretraining}
We adopt a recently released prostate mpMRI foundation model, ProFound, to investigate the fine-tuning effect. ProFound uses ConvNeXt v2 \cite{woo2023convnext} and is pre-trained using a masked autoencoder (MAE) \cite{he2022masked}, which is a self-supervised learning method that can be used to pre-train vision models. The model is pre-trained on an ensemble of private and public prostate mpMRI datasets of $\sim 5000$ patients, including the PI-CAI dataset \cite{saha2024artificial}, PROSTATE-MRI from the Cancer Imaging Archive \cite{Choyke_Turkbey_Merino_Wood_2025}, the ReImagine Risk dataset \cite{marsden2021update} (the same as one of the aforementioned downstream datasets), and a private dataset \cite{min2025segmentation}. More details such as pretraining protocols can be found in the ProFound repository\footnote{\url{https://github.com/pipiwang/ProFound}}.
\subsection{Foundation model fine-tuning}
To investigate the feature shift from fine-tuning the pre-trained foundation model, three prostate cancer related downstream tasks were explored.

\textbf{Prostate cancer risk group classification.} We fine-tune the ProFound model to predict the Prostate Imaging Reporting and Data System (PIRADS) scores, which is formulated as a multiclass classification task with patient groups of PIRADS scores of $<3$, $3$, $4$, and $5$. In this task, the ProFound model is fine-tuned by adding a simple head comprising two fully connected layers with an intermediate batch normalisation layer. The ReImagine risk dataset is used for the classification task and the model is trained with the Cross Entropy loss.

\textbf{Prostate cancer lesion segmentation.} The pre-trained model is adapted to delineate the lesion contour by inserting a UPerNet head \cite{xiao2018unified} after the encoder. Dice loss is used for fine-tuning the segmentation task on the UCLH dataset.

\textbf{Prostate gland volume estimation.} We also explore a regression task of predicting the prostate gland volume, where a simple head consisting of a batch normalisation layer followed by a fully connected layer is adopted. ProFound is fine-tuned on the UCLH dataset using the Mean Squared Error (MSE) loss.

All fine-tuned models are trained for $100$ epochs with a learning rate of $0.001$ using the AdamW optimiser. For the classification and segmentation task, the model takes input of three modalities, T2, high-b value DWI, and ADC maps, whereas the regression task only uses T2 as the model input.

\subsection{Radiomic feature extraction}
The radiomic features are extracted following a guidance \cite{zwanenburg2016image} using PyRadiomics (ver 3.1.0) \cite{van2017computational} on all mpMRI modalities of each patient. A selection of features were extracted, including first-order features, Gray Level Co-occurrence Matrix (GLCM) features, Gray Level Size Zone Matrix (GLSZM) features, Gray Level Run Length Matrix (GLRLM) features, Neighbouring Gray Tone Difference Matrix (NGTDM) features, Gray Level Dependence Matrix (GLDM) features, from both original and Wavelet filtered images. The Min-Max normalisation is performed on each radiomic feature to scale all features to a range of $[0,1]$. 

For the lesion segmentation task, we calculate two sets of radiomics, using lesion masks and prostate gland masks as ROIs respectively. As the data in this study mostly come from patients with low-to-medium-risk cancer, using only the lesion mask would provide a very limited ROI and may exclude regions with subtle extending and/or emerging abnormalities. Including the whole-gland mask would allow us to capture broader contextual and structural information that may be relevant for distinguishing lesion-related changes, especially in early disease. For the PIRADS score classification task and the prostate volume estimation task, we use the whole gland as ROI because PIRADS relies on a different primary determining sequence for each zone (peripheral zone and transition zone), and using only the lesion mask would lose the lesion's relative spatial location information. 

\subsection{Training the shared non-linear mapping}
\sloppy To train the shared non-linear mapping $f^{share}$ (Sect.~\ref{non-linear}), we perform a parameter sweep to select the values of $\lambda_1$ and $\lambda_2$ over all combinations of $\lambda_1 \in \{0, 10^{-7}, 3\times10^{-7}, 10^{-6}, 3\times10^{-6}, 10^{-5}\}$ and $\lambda_2 \in \{0, 10^{-5}, 10^{-4}, 10^{-3}\}$. The final adopted values are $\lambda_1 = 10^{-6}$ and $\lambda_2 = 10^{-5}$. The shared non-linear projection mapping is trained for 200 epochs with a learning rate of $0.001$.
% NOTE(review): the last \lambda_1 grid value was originally a duplicated 10^{-6}; 10^{-5} is assumed from the 1-3-10 progression -- please confirm.

\subsection{Representation shift measurement}
To quantitatively measure the feature shift in representing radiomics after fine-tuning, we adopt the following metrics.

\textbf{Importance score.}
For radiomic feature $k$ of modality $m$, the importance is defined as $I_{m,k} = ||\theta_{m,k,:}||_2$.
The change after fine-tuning is:
\begin{equation}
\label{eq:delta}
    \Delta I_{m,k} = I_{m,k}^{ft} - I_{m,k}^{p}.
\end{equation}

\textbf{$R^2$ score.} The $R^2$ score is also known as Coefficient of Determination, which is defined as 
\begin{equation}
R^2 = 1 - \frac{\text{Residual Sum of Squares}}{\text{Total Sum of Squares}}.
\end{equation}
We use $R^2$ to quantify how well the features from the foundation model encoder describe the radiomic information. 

\textbf{Mean Squared Error}. We also use MSE to investigate the capability of reconstructing radiomic features using the foundation model encoder representation.
We performed Wilcoxon signed-rank tests on the per-sample squared errors for each radiomic feature family on the evaluated tasks, comparing the pre-trained model with fine-tuned model.


\section{Results}
\subsection{Quantitative performance of the interpretation framework}
To assess the proposed radiomic feature representation framework, we report MSE and $R^2$ for three downstream tasks and various radiomic feature groups, together with all the detected statistical significances on squared errors, as shown in Tab.~\ref{tab:res}. Higher MSE and lower $R^2$ were obtained after the foundation model was adapted to specific tasks, suggesting that feature embeddings become less linearly recoverable into radiomic representations. A possible reason could be that the fine-tuned encoder extracts more specialised information, whereas the self-supervised pre-trained model captures more general information about the input images. 


For the classification and regression tasks, the radiomics were calculated using the prostate gland mask as ROI. For the volume regression task, the radiomic representation model exhibited the lowest MSE ($0.103$ and $0.206$) and the highest $R^2$ ($0.892$ and $0.785$) on NGTDM features, before and after fine-tuning respectively; NGTDM features were also the best reconstructed group for PIRADS classification after fine-tuning (MSE $0.300$, $R^2$ $0.717$). This indicates that information about structural patterns or inflammation relevant markers \cite{aguirre2025radiomics} is encoded by the foundation model. These patterns are likely to contribute more to the model predictive capability for PIRADS score classification and volume regression. 

We evaluated the regression performance using radiomic features extracted from two ROI definitions, the lesion mask and the whole prostate gland. When radiomics were computed at the lesion level, the regression achieved low $R^2$, indicating that lesion-level features provide limited explanatory power for the encoder representation in the segmentation task. This is likely due to the high variability and small spatial extent of individual lesions, which produce radiomic descriptors with low stability and weak correlation to global encoder embeddings.
In contrast, using gland-level radiomics substantially improved the regression fit, yielding $R^2\approx 0.4$. This suggests that the encoder captures information more strongly aligned with global prostate characteristics than with fine-scale lesion appearance. Gland-level attributes such as organ size, zonal anatomy, and age-related tissue changes are known to correlate with cancer presence and localisation, which may explain their stronger correspondence with encoder features. These findings also imply that lesion-specific radiomic features may be too heterogeneous or insufficiently discriminative to establish a stable mapping for this task.
For completeness and transparency, we report both ROI scenarios. Together, they illustrate that radiomics extracted at different anatomical scales provide different levels of explanatory value, and that the encoder’s behaviour in lesion segmentation is more consistently reflected in global prostate characteristics than in local lesion descriptors.
\begin{table}[htbp]
 % The first argument is the label.
 % The caption goes in the second argument, and the table contents
 % go in the third argument.
\floatconts
  {tab:res}%
  {\caption{Quantitative results showing the performance of the MLP across three downstream tasks on various groups of features. CLS = classification task, REG = regression task, SEG-L = segmentation task with lesion mask as radiomics ROI, SEG-P = segmentation task with prostate gland mask as radiomics ROI. Statistical significance levels are denoted by * $p < 0.05$, ** $p < 0.01$, and *** $p < 0.001$.}}%
  {\resizebox{0.9\textwidth}{!}{%
  \begin{tabular}{cclclclclc}
\toprule
\multirow{2}{*}{Feature} & \multirow{2}{*}{Stage} & \multicolumn{2}{c}{PIRADS CLS} & \multicolumn{2}{c}{Volume REG} & \multicolumn{2}{c}{Lesion SEG-L} & \multicolumn{2}{c}{Lesion SEG-P} \\ \cline{3-10}
 &  & MSE$\downarrow$ & $R^2 \uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ \\ \midrule
First order & Pre-train & 0.437 & 0.584 & 0.263 & 0.727 & 0.722 & 0.344 & 0.703 & 0.351 \\
 & Fine-tune & 0.452 & 0.569 & 0.366 *** & 0.621 & 0.775 *** & 0.296 & 0.732 ** & 0.325 \\ \midrule
GLCM & Pre-train & 0.365 & 0.659 & 0.132 & 0.860 & 0.623 & 0.436 & 0.584 & 0.492 \\
 & Fine-tune & 0.390 & 0.636 & 0.269 *** & 0.716 & 0.649 ** & 0.412 & 0.613 ** & 0.464 \\ \midrule
GLDM & Pre-train & 0.326 & 0.697 & 0.162 & 0.826 & 0.625 & 0.440 & 0.593 & 0.468 \\
 & Fine-tune & 0.347 * & 0.669 & 0.260 *** & 0.719 & 0.771 *** & 0.307 & 0.620 & 0.442 \\ \midrule
GLRLM & Pre-train & 0.263 & 0.760 & 0.140 & 0.851 & 0.656 & 0.422 & 0.725 & 0.367 \\
 & Fine-tune & 0.331 *** & 0.698 & 0.227 *** & 0.760 & 0.812 *** & 0.272 & 0.746 & 0.348 \\ \midrule
GLSZM & Pre-train & 0.614 & 0.409 & 0.453 & 0.529 & 0.928 & 0.186 & 0.752 & 0.272 \\
 & Fine-tune & 0.631 & 0.393 & 0.577 *** & 0.399 & 1.006 *** & 0.116 & 0.787 *** & 0.238 \\ \midrule
NGTDM & Pre-train & 0.287 & 0.735 & 0.103 & 0.892 & 0.712 & 0.361 & 0.665 & 0.400 \\
 & Fine-tune & 0.300 ** & 0.717 & 0.206 *** & 0.785 & 0.838 *** & 0.263 & 0.735 *** & 0.336 \\ \midrule
Original & Pre-train & 0.416 & 0.602 & 0.640 & 0.335 & 0.691 & 0.311 & 0.641 & 0.368 \\
 & Fine-tune & 0.453 * & 0.571 & 0.747 *** & 0.224 & 0.810 *** & 0.192 & 0.687 *** & 0.322 \\ \midrule
Wavelet & Pre-train & 0.430 & 0.599 & 0.279 & 0.704 & 0.791 & 0.302 & 0.776 & 0.308 \\
 & Fine-tune & 0.441 & 0.585 & 0.354 *** & 0.623 & 0.837 ** & 0.259 & 0.792 & 0.293 \\ \bottomrule
\end{tabular}}}
\end{table}

In addition to reporting radiomics group-wise performance, we also investigate the regression fit on different input modalities. We show three examples in Fig.~\ref{fig:highr2}, including the PIRADS classification task and the segmentation task with two ROI definitions. Only the feature types with the highest $R^2$ after fine-tuning are illustrated as examples. It can be observed that in the PIRADS classification task, radiomics of all three modalities are aligned to the foundation model features to a substantial degree, indicating comparable predictive power of all modalities. For the lesion segmentation task, in contrast, high-b value DWI and ADC radiomics align with foundation model features while T2 behaves in the opposite way, regardless of pre- or post- fine-tuning, which corresponds to the ability of ADC and high-b DWI to identify tumours by highlighting cancerous tissues with signal intensity different from that of normal tissues.

\begin{figure}[htb]
 % Caption and label go in the first argument and the figure contents
 % go in the second argument
\floatconts
  {fig:highr2}
  {\caption{$R^2$ of single modality on mpMRI tasks on the highest overall $R^2$ features.}}
  {\includegraphics[width=0.8\linewidth]{res-highr2.pdf}}
\end{figure}

\subsection{Qualitative case studies}

To understand how fine-tuning reshapes the encoder representation for PIRADS prediction, we examined radiomic features whose ability to explain encoder embeddings changed the most, as shown in Fig.~\ref{fig:case1}. For each radiomic descriptor, we quantified its explanatory value via $\Delta I$ calculated before and after fine-tuning, then ranked the features in three complementary ways: those that became newly important (positive $\Delta I$), those whose importance decreased (negative $\Delta I$), and those with the least absolute change among features that were globally stable. These three views reveal how fine-tuning shifts the encoder toward radiologically meaningful image characteristics used in PIRADS scoring.

\begin{figure}[htbp]
 % Caption and label go in the first argument and the figure contents
 % go in the second argument
\floatconts
  {fig:case1}
  {\caption{Radiomic feature changes for PIRADS classification tasks. The left side shows patient cases with all modalities and the prostate gland ROI, and right side lists features with the top and least five $\Delta I$.}}
  {\includegraphics[width=\linewidth]{res_topk.pdf}}
\end{figure}

\textbf{Features gaining importance: increased alignment with T2 structural patterns.} Radiomic features with the largest positive $\Delta I$ were predominantly T2-weighted texture and run-length measures, including GLCM-MCC, GLCM-correlation, and several GLRLM descriptors capturing long high-intensity runs or low-intensity structural streaks. These features quantify the coherence, organisation and zonal architecture of the prostate, for example in the peripheral and transition zones. PIRADS guidelines place a strong emphasis on these T2 features, as lesion visibility and morphological distortion on T2-weighted imaging are central markers of clinical suspicion. The increased ability of these descriptors to explain the encoder after fine-tuning indicates that the model becomes more attuned to the structured appearance of malignant regions and to deviations from normal glandular texture patterns. This shift suggests that fine-tuning makes the encoder more aligned with radiologists’ use of T2 structural cues for PIRADS assessment.

\textbf{Features losing importance: reduced reliance on unstable diffusion heterogeneity.} Radiomic features with the strongest negative $\Delta I$ primarily originated from ADC and high-b diffusion imaging. These include ADC-GLCM-Imc2, ADC-GLCM-DifferenceEntropy, ADC-GLDM-DNUN, and high-b kurtosis, all of which characterise fine-scale texture irregularity and local signal heterogeneity. While such patterns may loosely correlate with tumour presence, they are also known to be sensitive to acquisition noise, variation in b-values and small ROI instability, and they are not central to PIRADS scoring, which emphasises consistent diffusion restriction rather than stochastic heterogeneity. The drop in explanatory power after fine-tuning suggests that the encoder moves away from these volatile cues, instead prioritising more robust diffusion features. This behaviour reflects the goal of fine-tuning: to refine the model toward radiologically reliable indicators of high PIRADS scores and to suppress spurious correlations.

\textbf{Features with low shifts: stable global ADC and T2 indicators.} Among radiomic features that explained a substantial portion of encoder variance both before and after fine-tuning, those with the lowest absolute changes while maintaining moderate to high importance score included global ADC intensity descriptors (TotalEnergy, Energy) and T2 gray-level distribution measures (GLSZM-GLNUN, GLSZM-Variance). These metrics quantify overall diffusion signal level and non-uniformity, as well as global heterogeneity across the gland. These are radiologically meaningful biomarkers: PIRADS scoring heavily relies on diffusion restriction (low ADC) and lesion conspicuity cross-correlated across T2 and diffusion sequences. These stable features correspond to fundamental anatomical or textural characteristics that provide contextual structure but are not strongly task-discriminative for PIRADS scoring.


Using our proposed approach, across all the analyses, fine-tuning produces a systematic, clinically interpretable reorganisation of encoder features. The encoder strengthens its alignment with zonal T2 textural structure, reduces sensitivity to noise-prone diffusion heterogeneity, and retains the weighting of global ADC/T2 intensity and non-uniformity—all of which mirror established criteria in PIRADS scoring. These results show that radiomics provides a meaningful, interpretable lens through which fine-tuning behaviour can be understood, demonstrating that the model becomes progressively more “radiologist-like” in the cues it uses to assess prostate cancer suspicion.

\section{Discussion}
Radiomic features are known to be correlated with one another and to measure overlapping aspects of image texture and intensity. However, in this study, our goal is not to construct a minimal or decorrelated feature set, but to use these features as descriptive markers to monitor distributional shifts before and after the fine-tuning process. In this context, correlation among features does not undermine our objective, because we do not intend to use these features for predictive modeling or inference. Instead, any feature that reflects a change induced by fine-tuning is informative for our purpose. To mitigate potential instability arising from collinearity, we incorporate both $L1$ and $L2$ regularization within our methods.

Radiomic features also vary in their degree of interpretability. While some descriptors are less intuitive at a clinical level, they are still substantially more interpretable than most deep learning features, which are typically abstract latent representations without any inherent human-interpretable meaning. Future work could benefit from identifying and selecting a more interpretable subset of radiomic features for characterising fine-tuning effects.

We acknowledge that the presence of radiomic features in the embeddings does not guarantee their usefulness for downstream tasks. Therefore, in Appendix~\ref{ap} (Table~\ref{tab:resapp}), we also report downstream results for both 1) models with a frozen backbone and a trained task-specific head, and 2) models with both backbone and head fine-tuned. These correspond directly to the pre- and post-fine-tuning embeddings used in our radiomic analysis, and enable a more direct link between representation changes and downstream task performance. Notably, across all evaluated tasks, fine-tuning consistently yields improved downstream performance.

All experiments in this study were conducted using ProFound, which served as a concrete example for applying our radiomic analysis framework. While our methodological approach is model-agnostic and, in principle, applicable to any foundation model, we acknowledge that the specific feature-level findings reported here are likely influenced by the particular pretraining data, architecture, and downstream tasks used. As such, we do not claim that specific feature-level conclusions are expected to generalise further. For example, fine-tuning effects may vary for models pretrained on prostate MR images versus chest CT images, or for tasks such as segmentation versus classification. Nevertheless, although a much larger-scale study is required, understanding these differences or identifying potential feature shifts that remain invariant to pretraining, domain, or task remains an important future direction.

\section{Conclusion}
This study introduces a radiomics-based framework for interpreting how foundation model representations change during fine-tuning, offering a quantitative and clinically meaningful lens on encoder behaviour. Across three downstream prostate MRI tasks, we showed that radiomic features can partially reconstruct encoder embeddings, with the best alignment observed for gland-ROI-level radiomics and for modality–feature combinations consistent with radiological practice (e.g., high-b and ADC for lesion identification, global features for cancer risk). By comparing linear decoding weights before and after fine-tuning, our method revealed systematic and task-dependent shifts, for example, increased sensitivity to zonal T2 structure for PIRADS prediction, reduced reliance on unstable diffusion heterogeneity and stable weighting of global ADC/T2 signal characteristics.

While the radiomics-to-latent mapping explains only a fraction of encoder variance, this limitation reflects the complementary nature of hand-crafted radiomics and high-capacity foundation models. Future work may explore richer interpretable feature spaces, non-linear or sparsity-aware decoding and cross-task comparisons to establish a broader taxonomy of fine-tuning-induced representation changes. Overall, our findings demonstrate that radiomics provides a practical and principled interpretability tool, enabling foundation models to be probed, compared, adapted and potentially better understood with greater transparency in medical imaging applications.


% This is where the content of your paper goes.  Some random
% notes\footnote{Random footnote are discouraged}:
% \begin{itemize}
% \item You should use \LaTeX \cite{Lamport:Book:1989}.
% \item JMLR/PMLR uses natbib for references. For simplicity, here, \verb|\cite|  defaults to
%   parenthetical citations, i.e. \verb|\citep|. You can of course also
%   use \verb|\citet| for textual citations.
% \item Eprints such as arXiv papers can of course be cited \cite{Hinton:arXiv:2015:Distilling}. We recomend using a \verb|@misc| bibtex entry for these as shown in the sample bibliography.
% \item You should follow the guidelines provided by the conference.
% \item Read through the JMLR template documentation for specific \LaTeX
%   usage questions.
% \item Note that the JMLR template provides many handy functionalities
% such as \verb|\figureref| to refer to a figure,
% e.g. \figureref{fig:example},  \verb|\tableref| to refer to a table,
% e.g. \tableref{tab:example} and \verb|\equationref| to refer to an equation,
% e.g. \equationref{eq:example}.
% \end{itemize}

% \begin{table}[htbp]
%  % The first argument is the label.
%  % The caption goes in the second argument, and the table contents
%  % go in the third argument.
% \floatconts
%   {tab:example}%
%   {\caption{An Example Table}}%
%   {\begin{tabular}{ll}
%   \bfseries Dataset & \bfseries Result\\
%   Data1 & 0.12345\\
%   Data2 & 0.67890\\
%   Data3 & 0.54321\\
%   Data4 & 0.09876
%   \end{tabular}}
% \end{table}

% \begin{figure}[htbp]
%  % Caption and label go in the first argument and the figure contents
%  % go in the second argument
% \floatconts
%   {fig:example}
%   {\caption{Example Image}}
%   {\includegraphics[width=0.5\linewidth]{example-image}}
% \end{figure}

% \begin{algorithm2e}
% \caption{Computing Net Activation}
% \label{alg:net}
%  % older versions of algorithm2e have \dontprintsemicolon instead
%  % of the following:
%  %\DontPrintSemicolon
%  % older versions of algorithm2e have \linesnumbered instead of the
%  % following:
%  %\LinesNumbered
% \KwIn{$x_1, \ldots, x_n, w_1, \ldots, w_n$}
% \KwOut{$y$, the net activation}
% $y\leftarrow 0$\;
% \For{$i\leftarrow 1$ \KwTo $n$}{
%   $y \leftarrow y + w_i*x_i$\;
% }
% \end{algorithm2e}

\clearpage  % Acknowledgements, references, and appendix do not count toward the page limit (if any)
% Acknowledgments---Will not appear in anonymized version
\midlacknowledgments{
This work was supported by the National Institute for Health Research (NIHR) University College London Hospitals (UCLH) Biomedical Research Centre (BRC). This work was also supported by the International Alliance for Cancer Early Detection, an alliance between Cancer Research UK [C28070/A30912; C73666/A31378], Canary Center at Stanford University, the University of Cambridge, OHSU Knight Cancer Institute, University College London and the University of Manchester.
}


\bibliography{midl26_181}


\appendix
\section{Appendix}
\label{ap}
\begin{table}[h]
\centering
\caption{Downstream task results for models where the backbone is frozen and only the task-specific head is trained (denoted ``Pre-trained'' below), and for models where both the backbone and head are fine-tuned (denoted ``Fine-tuned''). CLS = classification task, REG = regression task, SEG = segmentation task, QWK = Quadratic Weighted Kappa.}
\label{tab:resapp}
\resizebox{0.5\textwidth}{!}{%
\begin{tabular}{llll}
\toprule
\multirow{2}{*}{} & PIRADS CLS & Volume REG & Lesion SEG \\ \cmidrule(lr){2-4}
 & QWK $\uparrow$ & MSE $\downarrow$ & Mean Dice $\uparrow$ \\ \midrule
Pre-trained & 0.118 & 0.007 & 0.399 \\
Fine-tuned & 0.326 & 0.004 & 0.429 \\ \bottomrule
\end{tabular}%
}
\end{table}

% \begin{table}[htbp]
%  % The first argument is the label.
%  % The caption goes in the second argument, and the table contents
%  % go in the third argument.
% \floatconts
%   {tab:res}%
%   {\caption{Quantitative results showing the performance of MLP across three downstream tasks on various group of features. CLS = classification task, REG = regression task, SEG-L = segmentation task with lesion mask as radiomics ROI, SEG-P = segmentation task with prostate gland mask as radiomics ROI}}%
%   {\resizebox{0.8\textwidth}{!}{%
%   \begin{tabular}{cccccccccc}
% \toprule
% \multirow{2}{*}{Feature} & \multirow{2}{*}{Stage} & \multicolumn{2}{c}{PIRADS CLS} & \multicolumn{2}{c}{Volume REG} & \multicolumn{2}{c}{Lesion SEG-L} & \multicolumn{2}{c}{Lesion SEG-P} \\ \cline{3-10}
%  &  & MSE$\downarrow$ & $R^2 \uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ & MSE$\downarrow$ & $R^2\uparrow$ \\ \midrule
% First oder & Pre-train & 0.463 & 0.470 & 0.547 & 0.390 & 0.808 & 0.085 & 0.638 & 0.241 \\
%  & Fine-tune & 0.468 & 0.447 & 0.568 & 0.366 & 0.815 & 0.068 & 0.673 & 0.209 \\ \midrule
% GLCM & Pre-train & 0.403 & 0.578 & 0.451 & 0.474 & 0.697 & 0.087 & 0.578 & 0.187 \\
%  & Fine-tune & 0.416 & 0.547 & 0.459 & 0.467 & 0.740 & 0.044 & 0.605 & 0.146 \\ \midrule
% GLDM & Pre-train & 0.342 & 0.615 & 0.485 & 0.466 & 0.771 & -0.096 & 0.612 & 0.185 \\
%  & Fine-tune & 0.378 & 0.587 & 0.485 & 0.466 & \textbf{0.751}$\downarrow$ & \textbf{-0.091}$\uparrow$ & 0.635 & 0.157 \\ \midrule
% GLRLM & Pre-train & 0.347 & 0.614 & 0.456 & 0.474 & 0.796 & -0.152 & 0.576 & 0.166 \\
%  & Fine-tune & 0.371 & 0.591 & 0.473 & 0.448 & 0.805 & -0.166 & 0.581 & 0.159 \\ \hline
% GLSZM & Pre-train & 0.691 & 0.277 & 0.971 & 0.042 & 0.883 & -0.218 & 0.869 & 0.098 \\
%  & Fine-tune & 0.708 & 0.252 & \textbf{0.887}$\downarrow$ & \textbf{0.124}$\uparrow$ & \textbf{0.839}$\downarrow$ & \textbf{-0.152}$\uparrow$ & 0.895 & 0.078 \\ \midrule
% NGTDM & Pre-train & 0.341 & 0.613 & 0.350 & 0.587 & 0.789 & -0.117 & 0.566 & 0.241 \\
%  & Fine-tune & \textbf{0.317}$\downarrow$ & \textbf{0.635}$\uparrow$ & 0.419 & 0.506 & 0.861 & -0.118 & 0.628 & 0.158 \\ \midrule
% Original & Pre-train & 0.564 & 0.362 & 0.682 & 0.242 & 1.000 & -0.086 & 0.733 & 0.282 \\
%  & Fine-tune & 0.574 & 0.345 & 0.688 & 0.234 & \textbf{0.950}$\downarrow$ & \textbf{-0.042}$\uparrow$ & 0.784 & 0.234 \\ \midrule
% Wavelet & Pre-train & 0.433 & 0.525 & 0.507 & 0.438 & 0.772 & -0.048 & 0.665 & 0.126 \\
%  & Fine-tune & \textbf{0.426}$\downarrow$ & \textbf{0.533}$\uparrow$ & 0.539 & 0.403 & \textbf{0.755}$\downarrow$ & \textbf{-0.017}$\uparrow$ & \textbf{0.651}$\downarrow$ & \textbf{0.142}$\uparrow$ \\ \bottomrule
% \end{tabular}}}
% \end{table}

% \section{Proof of Theorem 1}

% This is a boring technical proof of
% \begin{equation}\label{eq:example}
% \cos^2\theta + \sin^2\theta \equiv 1.
% \end{equation}

% \section{Proof of Theorem 2}

% This is a complete version of a proof sketched in the main text.

\end{document}
