\documentclass{midl} % Include author names
% \documentclass[anon]{midl} % Anonymized submission

% The following packages will be automatically loaded:
% jmlr, amsmath, amssymb, natbib, graphicx, url, algorithm2e
% ifoddpage, relsize and probably more
% make sure they are installed with your latex distribution

\usepackage{mwe} % to get dummy images

\jmlryear{2024}
\jmlrworkshop{Full Paper -- MIDL 2024}
\jmlrvolume{-- 057}
\editors{Accepted for publication at MIDL 2024}

\title[ThickV-Stain]{ThickV-Stain: Unprocessed Thick Tissues Virtual Staining for Rapid Intraoperative Histology}

 % Use \Name{Author Name} to specify the name.
 % If the surname contains spaces, enclose the surname
 % in braces, e.g. \Name{John {Smith Jones}} similarly
 % if the name has a "von" part, e.g \Name{Jane {de Winter}}.
 % If the first letter in the forenames is a diacritic
 % enclose the diacritic in braces, e.g. \Name{{\'E}louise Smith}

 % Two authors with the same address
 % \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\and
 %  \Name{Author Name2} \Email{xyz@sample.edu}\\
 %  \addr Address}

 % Three or more authors with the same address:
 % \midlauthor{\Name{Author Name1} \Email{an1@sample.edu}\\
 %  \Name{Author Name2} \Email{an2@sample.edu}\\
 %  \Name{Author Name3} \Email{an3@sample.edu}\\
 %  \addr Address}


% Authors with different addresses:
% \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\\
% \addr Address 1
% \AND
% \Name{Author Name2} \Email{xyz@sample.edu}\\
% \addr Address 2
% }

%\footnotetext[1]{Contributed equally}

% More complicate cases, e.g. with dual affiliations and joint authorship
\midlauthor{\Name{Lulin Shi\midljointauthortext{Contributed equally}\nametag{$^{1}$}} \Email{lshiao@connect.ust.hk}\\
\Name{Xingzhong Hou\midlotherjointauthor\nametag{$^{2}$}} \Email{houxingzhong@ict.ac.cn}\\
\Name{Ivy H. M. Wong\nametag{$^{1}$}} \Email{hmwongal@connect.ust.hk}\\
\Name{Simon C. K. Chan\nametag{$^{1}$}} \Email{ckchanbq@connect.ust.hk}\\
\Name{Zhenghui Chen\nametag{$^{1}$}} \Email{zchenef@connect.ust.hk}\\
\Name{Claudia T. K. Lo\nametag{$^{1}$}} \Email{ketkloae@ust.hk}\\
\Name{Terence T. W. Wong\midljointauthortext{Corresponding author}\nametag{$^{1}$}} \Email{ttwwong@ust.hk}\\
\addr $^{1}$ Translational and Advanced Bioimaging Laboratory, Department of Chemical and Biological Engineering, The Hong Kong University of Science and Technology, Hong Kong, China \\
\addr $^{2}$ State Key Laboratory of Computer Architecture, Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China\\
}

\begin{document}

\maketitle

\begin{abstract}
Virtual staining has shown great promise in realizing a rapid and low-cost clinical alternative for pathological examinations, eliminating the need for chemical reagents and laborious staining procedures. However, most previous studies focus on thin slice samples, which still require tissue sectioning and are unsuitable for intraoperative use. In this paper, we propose a multi-scale model to virtually stain label-free and slide-free biological tissues, allowing hematoxylin and eosin (H\&E) staining generation in less than a minute for an image with 100 million pixels. We name this model ThickV-Stain; it is specifically developed to virtually stain intricate and unprocessed thick tissues. We harness the ability of a multi-scale network to encourage the model to capture multiple-level micromorphological characteristics from low-resolution images. Experimental results highlight the advantages of our method for virtual staining on unprocessed thick samples. We also show the effectiveness of ThickV-Stain on thin sections, demonstrating generalizability to other clinical workflows. The proposed method enables us to obtain virtually stained images from unstained samples within minutes and can be seamlessly integrated with downstream pathological analysis tasks, providing an efficient alternative scheme for intraoperative assessment as well as general pathological examination.
\end{abstract}

\begin{keywords}
Virtual staining, deep learning, label-free imaging, unprocessed biological tissues
\end{keywords}

\section{Introduction}
\label{sec:introduction}

\begin{figure}[!t]
% \caption and \label must share one group so that \ref{fig1} resolves to the figure number.
\centerline{\includegraphics[width=0.85\textwidth]{figures/1.pdf}}
\centering
\caption{Histological examination workflow comparison.}
\label{fig1}
\end{figure}

Histological examination is regarded as the gold standard for cancer diagnosis, which aims to determine whether there are any lesions or to analyze the tissue microenvironment \cite{gurcan2009histopathological}. However, routine histological staining is chemical reagent-dependent and usually takes several days for sample preparation, heavily limiting its application to rapid histopathology, especially intraoperative tissue examination \cite{maloney2018introreview}. Although the frozen section has been considered as an alternative for rapid pathological diagnosis to guide tumor resection in surgery, frozen samples are unstable and rapid freezing easily introduces artifacts, making diagnosis difficult or even leading to misdiagnosis \cite{taxy2009frozen}. With the development of section-free imaging techniques, unprocessed thick tissue samples can be visualized in grayscale images without sectioning procedures \cite{fereidouni2017muse, glaser2017lightsheet}. However, the use of label-free or stain-free microscopes is not part of the routine diagnostic workflow for pathologists, and it is difficult for pathologists to interpret biological changes from the grayscale images acquired in this way.

The emergence of virtual staining has provided a novel solution for achieving rapid histology. It refers to the digital transformation or generation of histological stains through computer algorithms \cite{bai2023uclareview}. There are some studies on the image transformation from H\&E staining to special or immunohistochemistry (IHC) staining \cite{liu2021tmi, de2021HE2sepcial, lahiani2019seamless, vasiljevic2021towards, lahiani2020seamless, xu2020HE2IHC} and image generation from unstained thin sections \cite{rivenson2019uclanature, rivenson2019uclaphasestain, zhang2020uclamultistain, li2020carotidstain, Li2021utom, meng2021Ovarian, shi2023isbi}. Although the existing virtual staining studies have achieved impressive performance, they mainly rely on well-prepared thin slices, and the acquisition and preparation of these thin slices are still cumbersome and time-consuming (as shown in Figure \ref{fig1}a), which is unsuitable for intraoperative tissue diagnosis. Therefore, this paper does not focus on image translation from the existing staining or unstained thin sections but focuses on virtual H\&E staining from sectioning-free and label-free tissues.

In this paper, we investigate directly using autofluorescence (AF) microscopy \cite{zhang2022champ} to obtain AF images of unprocessed thick samples, which does not necessitate tissue embedding, sectioning, and dewaxing (Figure~\ref{fig1}c). Our objective is to convert the acquired grayscale images into pathologist-interpretable images. Additionally, we show that the virtually stained images can further be used for automatic tumor diagnosis. The whole procedure of the proposed pipeline can be completed within several minutes with minimal tissue preparation. In comparison to the frozen section (Figure~\ref{fig1}b), our method is faster and non-destructive to tissues. In brief, the key contributions of this paper are as follows: (1) We propose a ThickV-Stain model\footnote{Code and model are available at \url{https://github.com/TABLAB-HKUST/ThickV-Stain}.} for complicated unprocessed bio-samples. (2) We are the first to propose using a multi-scale generator for virtual staining from low-quality input images. (3) We achieve state-of-the-art (SOTA) performance on both thick tissue and thin section data.



\section{Method}
\label{sec:Method}
\subsection{Research Problem}

\begin{figure}[!t]
\centerline{\includegraphics[width=0.86\linewidth]{figures/2.pdf}}
\centering
\caption{Comparison between thick samples and thin sections. (a) The multi-layer information due to the deeper imaging depth inevitably degrades the image quality. (b) Morphological differences between AF of thick tissue and H\&E-stained image.}
\label{fig3}
\end{figure}

The research problem is the automatic translation from grayscale AF images of thick samples to histologically stained images, which can be easily integrated with other downstream tasks (e.g., tumor detection and report generation), enabling rapid intraoperative diagnosis.

The first challenge here is the low image quality of AF input. In slide-free microscopy, AF images from thick specimens suffer lower molecular contrast and are blurrier. This is due to the lack of optical sectioning capability in the slide-free imaging system and multi-layer information would be captured at the same time. From Figure \ref{fig3}a, we can see that the image quality and resolution of the thick samples are relatively poor when compared with that of thin tissue slices. Therefore, it is much more challenging to recognize and transform those indistinguishable components from images of unprocessed thick specimens. As shown in Figure \ref{fig3}a, cell nuclei arranged in adenocarcinoma acinar structure can be observed in the AF of the thin section while no obvious related features are shown in the AF of thick tissues. Hence, it poses a huge challenge to learn the correct mapping between two domains.

Another barrier is that it is not possible to obtain chemically stained images that are aligned with the unstained images for model training, as histological staining can only be carried out on a thin slide. In this situation, after acquiring scanned images of unprocessed and unstained thick samples, only the scanned surface would be sectioned and stained for reference. Since AF images of thick samples contain multiple-layer information, there will be a considerable morphological difference between the AF images and the chemically stained versions (Figure~\ref{fig3}b). Unsupervised learning is required when there is no paired ground truth. Current unsupervised virtual staining methods mainly exploit cycleGAN as the basic architecture \cite{zhu2017cyclegan}. \cite{Li2021utom} shows that cycleGAN can hardly distinguish the background and tissue context in the virtual staining of complicated human samples. This is because the cycle-consistency loss cannot guarantee semantic rationality: even if the semantic change in the model output image is incorrect, the reconstructed image can still be recovered perfectly under this loss. Some works have also reported that the cycle-consistency loss plays an indispensable role in preserving the key structures of input images \cite{pumarola2018ganimation}, but imposes only weak constraints between the translated output and the ground truth \cite{liu2021tmi}. To resolve this ambiguity, some researchers have tried to use saliency masks \cite{Li2021utom} and region labels \cite{shi2022oneside} as semantic guidance for virtual staining.

In our case, it is quite challenging to extract a consistent saliency mask or region label due to the limited image contrast. We address the above challenges with a multi-scale generator. We argue that a multi-scale model can extract sufficient information for a better understanding of the complex data without requiring additional supervision or manual annotations. Different scales are intended to focus on different histological patterns according to their receptive field sizes, thereby capturing multi-level representations.


\subsection{ThickV-Stain: Thick Biological Tissues Virtual Staining}
\label{subsec:generator}

\begin{figure}[!t]
\centerline{\includegraphics[width=0.61\linewidth]{figures/3.pdf}}
\centering
\caption{Overview of the proposed ThickV-Stain Generator. The multi-scale U-Nets share the same parameters.}
\label{fig4}
\end{figure}

To pay special attention to learning multi-structural features, we propose a novel multi-scale generator, as shown in Figure~\ref{fig4}. It consists of three U-Net modules with the same convolution kernel size ($4 \times 4$) but with different receptive fields due to different input image resolutions. The top branch in Figure~\ref{fig4} captures more detailed histological features, such as cell nuclei. This is because the convolution kernel of this module perceives small objects at the input resolution. Conversely, the bottom branch perceives a larger field because the original image is scaled down, capturing global information such as edges and background.

The U-Net architecture used in this paper consists of an encoder and a decoder network. The encoder involves 5 convolution layers and the decoder consists of 5 fractionally-strided convolution layers that upsample the feature maps to the original spatial dimensions. The feature maps from the encoder with the corresponding ones from the decoder are connected by skip connections to preserve the spatial information from the input. Following the U-Net, the outputs from the two additional scales are resized to the original size of the input image and then concatenated to get the final output. The form of the output can be expressed as:

\begin{equation}
G(x)=\mathrm{conv}([ U_{1} (x),R(U_{2} (x)),R(U_{3} (x))])
\end{equation}

where $[\cdot]$ refers to the concatenation operator, $U_{i}$ represents the $i$-th branch. $R(\cdot)$ denotes the bicubic interpolation function to change the size of images. We use 2 resize blocks here to achieve the increase of two additional scales (H/2, W/2) and (H/4, W/4).

To avoid mode collapse caused by an imbalanced design between the generator and discriminator, we also use a multi-scale discriminator \cite{wang2018pix2pixHD}. The input image is processed at three scales, with each scale being processed by a separate network. These three discriminator networks have an identical structure but operate at different image scales. The outputs of the networks are then combined to produce a final score.

Besides GAN loss \cite{goodfellow2020gan}, we further use identity loss \cite{taigman2016identity} for better structure preserving. The overall loss functions are shown below:

\begin{equation}
\mathcal L^{G}_{adv} = - \mathbb{E}_{x}[ \log D(G(x))]
\end{equation}
\begin{equation}
\mathcal L^{D}_{adv} = \mathbb{E}_{x}[\log D(G(x))] + \mathbb{E}_{y}[\log(1 - D(y))]
\end{equation}
\begin{equation}
\mathcal L_{idt}=\mathbb{E}_{y} \left \| y-G(y) \right \| _{1}
\end{equation}
\begin{equation}
\mathcal L = \mathcal L_{adv} + \lambda \mathcal L_{idt}
\label{equ5}
\end{equation}



\section{Experiments and results}
\subsection{Dataset}
\label{subsec: dataset}
The data used in this paper were collected from 14 patients and involved various lung adenocarcinoma subtypes. The H\&E-stained slices used for training were cut from the imaged thick sample surface. Because whole slide images (WSIs) are very large ($\sim$20,000 $\times$ $\sim$20,000 pixels), we randomly sampled 10,000 small image patches of size $256 \times 256$ per epoch from seven patients for training. During testing, each WSI of the remaining seven patients' data was split into $256 \times 256$ images with a 16-pixel overlap to avoid artifacts, and the test cohort included 31,317 image patches (thick sample data used in Section~\ref{subsec:results1}) and 22,283 image patches (thin section data used in Section~\ref{subsec:results2}).

\subsection{Implementation Details}
\label{subsec: Details}
The overall network was implemented in PyTorch on a single NVIDIA GeForce RTX 3090 GPU. We used a U-Net at each scale to form our generator, and a multi-scale discriminator based on pix2pixHD. We trained our model with the Adam optimizer (with $\beta_{1} = 0.5$, $\beta_{2} = 0.999$). The initial learning rate was set to $2 \times 10^{-4}$ for the generator and $1 \times 10^{-4}$ for the discriminator, with a linear decay scheduled after 15,000 iterations. The different learning rates were chosen to avoid mode collapse due to the fast convergence of the discriminator. The batch size was set to 16. The $\lambda$ in Eq.~\eqref{equ5} was set to 5.


\subsection{Experiment on Thick Tissue Data}
\label{subsec:results1}

In this paper, we chose commonly used unsupervised image-to-image (I2I) translation architectures, including cycleGAN and CUT, and a seminal virtual staining model (UTOM), as the baseline models. The visual comparison is shown in Figure~\ref{fig6}. Compared to the AF image, the H\&E staining (1\textsuperscript{st} column) can only visualize some surface structure of the sample, providing a basic reference rather than an exact ground truth.
\begin{figure}[!t]
\centerline{\includegraphics[width=\textwidth]{figures/4.pdf}}
\centering
\caption{Comparison results on thick tissues. The 1$^{st}$ column is traditional H\&E staining of a thin slice sectioned from the imaged surface of thick tissue (2$^{nd}$ column).}
\label{fig6}
\end{figure}

\begin{table}[!t]
    \centering
    \caption{Quantitative evaluation with different methods.}
    \resizebox{0.85\linewidth}{0.75in}{
    \begin{tabular}{c|c|c|c|c|c}
    \hline
        \multicolumn{2}{c|}{} & {\textbf{CycleGAN}} & \textbf{CUT} & \textbf{UTOM} & \textbf{ThickV-Stain} \\ \hline 
        \textbf{Thick} & FID↓ & 97.24 $\pm$ 5.88	& 97.26 $\pm$ 24.37	& 62.00 $\pm$ 6.88	& \textbf{36.71 $\pm$ 3.27} \\ 
                       
                       & KID↓ & 0.06 $\pm$ 0.01 & 0.06 $\pm$ 0.02 & 0.03 $\pm$ 0.01 & \textbf{0.01 $\pm$ 0.01}	\\
                       
                      & T-MSE↓ & 1.00 $\pm$ 0.05 & \textbf{0.92 $\pm$ 0.04} & 1.06 $\pm$ 0.19 & 0.95 $\pm$ 0.02	\\ \hline
                      
        \textbf{Thin} & FID↓ & 45.21 $\pm$ 4.37 & 61.12 $\pm$ 1.39 & 95.13 $\pm$ 31.00 & \textbf{19.28 $\pm$ 1.57} \\
        
                      & KID↓ & 0.02 $\pm$ 0.00 & 0.05 $\pm$ 0.01 & 0.05 $\pm$ 0.02 & \textbf{0.01 $\pm$ 0.00} \\ 
                      
                      & SSIM↑ & 0.54 $\pm$ 0.07 & 0.29 $\pm$ 0.00 & 0.46 $\pm$ 0.07 & \textbf{0.61 $\pm$ 0.02} \\
                      & PSNR↑ & 14.33 $\pm$ 0.07 & 13.53 $\pm$ 0.04 & 15.74 $\pm$ 1.70 & \textbf{17.82 $\pm$ 0.07}
                       \\ 
                     & MSE↓ (×$10^{2}$) & 24.17 $\pm$ 0.35 & 29.03 $\pm$ 0.31 & 19.05 $\pm$ 8.11 & \textbf{11.05 $\pm$ 0.13} \\\hline

    \end{tabular}}
    \label{tab1}
\end{table}


\begin{table}[!t]
    \centering
    \caption{Professional assessment average score on test slides from two pathologists. The result is rated from 0–5. Higher scores represent better quality. }
    \resizebox{\linewidth}{0.53in}{
    \begin{tabular}{c|c|c|c|c|c}
    \hline
          & \multicolumn{2}{|c|}{\textbf{Visual quality}} & \multicolumn{3}{|c}{\textbf{Pathological features}} \\ 
          \cline{2-6}
          
          & \textbf{Fidelity} & \textbf{Accuracy} & \textbf{Nuclei} & \textbf{Extracellular fibrosis} & \textbf{Overall} \\ \hline
        CycleGAN & 2.07	& 1.54	& 2.39	& 1.36	& 1.57 \\ 
        CUT & 2.79 & 2.79 & 2.36 & 2.11	& 2.54 \\ 
        UTOM & 4.11 & 2.86 & 2.29 & 2.43 & 3.00 \\ 
        \textbf{ThickV-Stain} & \textbf{4.61} & \textbf{3.43} & \textbf{2.79} & \textbf{3.18} & \textbf{3.82}\\ \hline
    \end{tabular}}
    \label{tab2}
\end{table}
 

In the 2\textsuperscript{nd} row (marked with a blue arrow), there are obvious pathological features of fibrosis in our results. From the 3\textsuperscript{rd} row, the major tumor component consisting of solid sheets can be observed in our results (marked with yellow dashed lines). The same structure can also be observed in the H\&E-stained reference image. Even though UTOM also draws a correct outline, it misses cell nuclear information within the outline. Both CUT and cycleGAN mistranslate the background areas, which is consistent with \cite{Li2021utom}. To evaluate the image quality quantitatively, we calculate the Fréchet Inception Distance (FID) \cite{heusel2017fid} and Kernel Inception Distance (KID) \cite{binkowski2018kid}. The results are shown in Table~\ref{tab1}, where ThickV-Stain achieves the best FID score (36.71). UTOM and cycleGAN are better than CUT, showing the same trend as the visual analysis.

To explore whether our virtual staining meets clinical needs, we invited two pathologists to score our virtually stained images. The evaluation metrics are from two aspects: the pathological properties and visual quality. We followed the setting from \cite{rivenson2019uclanature} to evaluate nuclei details, extracellular fibrosis, and overall staining quality. Regarding the visual quality, fidelity refers to whether any artifacts in the stained image can affect the image quality and accuracy refers to whether the pathological diagnosis (e.g., the location of the tumor region) from virtually stained images is consistent with the real staining. The evaluation results in Table \ref{tab2} show that our model significantly outperforms other baseline models. The results of cycleGAN and CUT provide limited useful information to the pathologist, which is consistent with our analysis of visual results. 

Moreover, we apply a lung adenocarcinoma detection model for automatic tumor region detection with our virtually stained results. \cite{wang2018scientifre} use human lung adenocarcinoma cancer data, which is consistent with our case. Here, we apply the trained model on both generated images and real H\&E images to see whether our virtually stained results yield diagnostic conclusions consistent with real staining. In addition, the mean squared error (MSE) between the two tumor probability maps, denoted T-MSE, can be used to evaluate the potential of virtually stained results in real clinical practice. The comparative results can be found in Table~\ref{tab1}, and a visual example can be found in Appendix Figure~\ref{fig5}.


\subsection{Experiment on Thin Slice Data}
\label{subsec:results2}
We also validate the extensibility of the proposed method to other clinical workflows. Moreover, the ground truth is accessible for the virtual staining of thin sections, which can provide an accurate evaluation of the model performance. It can be observed that ThickV-Stain (Figure~\ref{fig7}c) outperforms other baseline models on unstained thin slices compared with ground truth (Figure~\ref{fig7}b). As for quantitative measures, we chose the structural similarity index measure (SSIM), peak signal-to-noise ratio (PSNR), and MSE as metrics because ground truth can be obtained for thin-section virtual staining. The numerical results are shown in Table~\ref{tab1}. Regarding PSNR and MSE, ThickV-Stain and UTOM are relatively close, and CUT is inferior to the other models. As for the FID and KID scores computed on the test set, ThickV-Stain significantly outperforms other models.

\begin{figure}[!t]
\centerline{\includegraphics[width=0.95\textwidth]{figures/5.pdf}}
\centering
\caption{Virtual staining results on thin sections. (a) Input AF. (b) Real H\&E staining. (c) ThickV-Stain. (d) UTOM. (e) CUT. (f) CycleGAN.}
\label{fig7}
\end{figure}


\subsection{Ablation Study}
\label{subsec:ablation}
\begin{figure}[!t]
\centerline{\includegraphics{figures/6.pdf}}
\centering
\caption{Ablation study. The tumor regions are marked manually with purple lines.}
\label{fig8}
\end{figure}

In this paper, we claim that the virtual staining performance on complicated datasets, especially unprocessed thick tissue, is limited if the model cannot represent complex features adequately. To explore the importance of the multi-scale model for virtual staining of complicated thick samples, we carried out an ablation study on the multi-scale generator.

From Figure~\ref{fig8}, we can see that for virtual staining of thin section data, even a single-scale generator can perform well. It achieves correct translation where the same cancerous patterns and fibrosis can be observed, with only slight degradation in image quality compared with the multi-scale generator. There is also no significant difference in the FID results (20.29 for the multi-scale and 21.74 for the single-scale generator). We attribute this to the fact that the AF images of thin sections are of such high quality that even a single-scale model is sufficient to correctly transform the image features. In this case, the multi-scale design does not have obvious advantages when dealing with simple data.

Secondly, for thick tissues, the single-scale generator cannot recover the fibrosis and quantitative results are also far from satisfactory compared with the multi-scale generator, which shows the importance of the multi-scale model for handling complicated data.  

Additionally, the single-scale generator on thin sections even achieves a better FID than the multi-scale generator on thick tissues (21.74 vs.\ 42.39). This means that even increasing the complexity of the model cannot completely offset the impact of data complexity. Virtual staining of thick tissue still struggles to achieve results comparable to those on thin slice data.

\section{Conclusion}
In this paper, we present ThickV-Stain for virtual histological staining on unprocessed thick tissues. Specifically, we design a multi-scale generator to fuse large receptive field image features to achieve virtual staining on complex data. We also use a well-trained lung adenocarcinoma detection model to demonstrate the potential of our generated staining to be integrated with other downstream pathological image analysis tasks. With our proposed ThickV-Stain, the staining task of thick samples can be implemented, allowing pathologists to identify pathological features on unprocessed samples directly, thus providing an alternative approach for rapid pathology.


% Acknowledgments---Will not appear in anonymized version
\midlacknowledgments{This work was supported by the Research Grants Council of the Hong Kong Special Administrative Region (16208620 \& 26203619) and an internal grant at HKUST (OKT21EG12). The authors would like to thank Dr.~Ronald C. K. Chan for the valuable discussion, and Dr.~Michael K. Y. Hsin for patient recruitment. The lung cancer samples used in this paper were collected from the Queen Mary Hospital. All human experiments were carried out in conformity with a clinical research ethics review approved by the Institutional Review Board of the University of Hong Kong/Hospital Authority Hong Kong West Cluster (HKU/HA HKW) (reference number: UW 20-335), and informed consent was obtained from all lung cancer tissue donors.}


\bibliography{midl24_057}

\appendix
\section{Example of downstream task performed on virtually stained results}
\begin{figure}[htbp]
\centerline{\includegraphics[width=\columnwidth]{figures/7.pdf}}
\centering
\caption{Comparison between pathologist’s annotation and artificial intelligence (AI)-based tumor detection. The left column is tumor region annotation from pathologists for comparison, where the red lines highlight the tumor region and green areas indicate the normal region. The right part is AI-based tumor prediction results on both virtual staining and actual H\&E staining, in which areas in red and blue mean a higher and lower probability of tumor, respectively. }
\label{fig5}
\end{figure}

\section{Score table from pathologists}
\begin{table}[htbp]
    \centering
    \caption{Raw data of score table from pathologists. a) UTOM, b) CUT, c) ThickV-Stain, d) CycleGAN}
    \scalebox{0.85}{
    \begin{tabular}{|c|ccccc|ccccc|ccccc|}
    \hline
          Tissue & \multicolumn{5}{|c|}{\textbf{Pathologist 1}} & \multicolumn{5}{|c|}{\textbf{Pathologist 2}} &\multicolumn{5}{|c|}{\textbf{Average}} \\ 
          \cline{2-16}
          
          No. & \textbf{FD} & \textbf{AC} & \textbf{ND} & \textbf{EF} & \textbf{OS}& \textbf{FD} & \textbf{AC} & \textbf{ND} & \textbf{EF} & \textbf{OS}& \textbf{FD} & \textbf{AC} & \textbf{ND} & \textbf{EF} & \textbf{OS} \\ \hline

          1(a) & 5 & 3 & 2 & 1 & 2 & 3.5 & 2.5 & 3 & 3.5 & 3 & 4.25 & 2.75 & 2.5 & 2.25 & 2.5 \\
          1(b) & 4 & 3 & 2 & 1 & 2 & 1.5 & 3.5 & 3 & 3 & 3.5 & 2.75 & 3.25 & 2.5 & 2 & 2.75 \\
          1(c) & 4 & 4 & 3 & 3 & 4 & 5 & 4 & 3.5 & 4 & 4.5 & \textbf{4.5} & \textbf{4} & \textbf{3.25} & \textbf{3.5} & \textbf{4.25} \\
          1(d) & 1 & 2 & 3 & 1 & 1 & 3.5 & 2 & 1.5 & 1.5 & 2 & 2.25 & 2 & 2.25 & 1.25 & 1.5 \\
          \hline

          2(a) & 5 & 3 & 1 & 1 & 2 & 3 & 2 & 1.5 & 2.5 & 3.5 & 4 & 2.5 & 1.25 & 1.75 & 2.75 \\
          2(b) & 4 & 3 & 2 & 2 & 2 & 1.5 & 4 & 3.5 & 3.5 & 3 & 2.75 & \textbf{3.5} & 2.75 & \textbf{2.75} & 2.5 \\
          2(c) & 5 & 3 & 3 & 2 & 3 & 4 & 3.5 & 2.5 & 3 & 4 & \textbf{4.5} & 3.25 & 2.75 & 2.5 & \textbf{3.5} \\
          2(d) & 1 & 1 & 4 & 1 & 1 & 3 & 3.5 & 3.5 & 2 & 2.5 & 2 & 2.25 & \textbf{3.75} & 1.5 & 1.75 \\
          \hline

          3(a) & 5 & 3 & 2 & 1 & 3 & 2 & 2 & 2 & 4 & 3.5 & 3.5 & 2.5 & 2 & 2.5 & 3.25 \\
          3(b) & 4 & 3 & 1 & 2 & 2 & 1.5 & 2 & 2 & 3.5 & 3 & 2.75 & 2.5 & 1.5 & 2.75 & 2.5 \\
          3(c) & 5 & 2 & 2 & 3 & 3 & 3.5 & 3 & 3 & 3.5 & 4 & \textbf{4.25} & 2.5 & \textbf{2.5} & \textbf{3.25} & \textbf{3.5} \\
          3(d) & 1 & 1 & 2 & 1 & 1 & 2 & 1 & 1.5 & 1.5 & 2 & 1.5 & 1 & 1.75 & 1.25 & 1.5 \\
          \hline

          4(a) & 5 & 3 & 3 & 1 & 4 & 4 & 3.5 & 3 & 4.5 & 4 & 4.5 & 3.25 & 3 & 2.75 & 4 \\
          4(b) & 4 & 2 & 2 & 2 & 3 & 1.5 & 2 & 3 & 3.5 & 2.5 & 2.75 & 2 & 2.5 & 2.75 & 2.75 \\
          4(c) & 5 & 3 & 3 & 3 & 4 & 5 & 4 & 3.5 & 4.5 & 5 & \textbf{5} & \textbf{3.5} & \textbf{3.25} & \textbf{3.75} & \textbf{4.5} \\
          4(d) & 1 & 1 & 1 & 1 & 1 & 3 & 1.5 & 2 & 2 & 2 & 2 & 1.25 & 1.5 & 1.5 & 1.5 \\ 
          \hline

          5(a) & 5 & 3 & 2 & 1 & 2 & 3 & 2 & 2 & 3 & 3 & 4 & 2.5 & 2 & 2 & 2.5 \\
          5(b) & 5 & 3 & 2 & 1 & 2 & 2 & 2.5 & 1 & 1.5 & 2 & 3.5 & 2.75 & 1.5 & 1.25 & 2 \\
          5(c) & 5 & 4 & 2 & 2 & 3 & 4 & 3.5 & 3 & 3 & 4 & \textbf{4.5} & \textbf{3.75} & \textbf{2.5} & \textbf{2.5} & \textbf{3.5} \\
          5(d) & 2 & 1 & 2 & 1 & 1 & 3 & 1 & 1.5 & 1 & 1.5 & 2.5 & 1 & 1.75 & 1 & 1.25 \\
          \hline

          6(a) & 5 & 3 & 3 & 2 & 2 & 4 & 3.5 & 3 & 3.5 & 3 & 4.5 & 3.25 & 3 & 2.75 & 2.5 \\
          6(b) & 4 & 4 & 3 & 1 & 2 & 1.5 & 3.5 & 4 & 2.5 & 3.5 & 2.75 & \textbf{3.75} & \textbf{3.5} & 1.75 & 2.75 \\
          6(c) & 5 & 3 & 2 & 3 & 3 & 4 & 3.5 & 3 & 3.5 & 4 & 4.5 & 3.25 & 2.5 & \textbf{3.25} & \textbf{3.5} \\
          6(d) & 2 & 1 & 3 & 1 & 1 & 2.5 & 3 & 3 & 2.5 & 3 & 2.25 & 2 & 3 & 1.75 & 2 \\
          \hline

          7(a) & 4 & 4 & 3 & 3 & 4 & 4 & 2.5 & 1.5 & 3 & 3 & 4 & 3.25 & 2.25 & 3 & 3.5 \\
          7(b) & 3 & 2 & 3 & 1 & 3 & 1.5 & 1.5 & 1.5 & 2 & 2 & 2.25 & 1.75 & 2.25 & 1.5 & 2.5 \\
          7(c) & 5 & 4 & 3 & 3 & 4 & 5 & 3.5 & 2.5 & 4 & 4 & \textbf{5} & \textbf{3.75} & 2.75 & \textbf{3.5} & \textbf{4} \\
          7(d) & 1 & 1 & 4 & 1 & 1 & 3 & 1.5 & 1.5 & 1.5 & 2 & 2 & 1.25 & 2.75 & 1.25 & 1.5 \\
          \hline

    \end{tabular}
    }
    \label{tab3}
\end{table}


\end{document}
