% This is samplepaper.tex, a sample chapter demonstrating the
% LLNCS macro package for Springer Computer Science proceedings;
% Version 2.21 of 2022/01/12
%
\documentclass[runningheads]{llncs}
%
\usepackage[T1]{fontenc}
\usepackage{amsmath}
\usepackage[figuresright]{rotating}
% T1 fonts will be used to generate the final print and online PDFs,
% so please use T1 fonts in your manuscript whenever possible.
% Other font encondings may result in incorrect characters.
%
\usepackage{graphicx}
% Used for displaying a sample figure. If possible, figure files should
% be included in EPS format.
%
% If you use the hyperref package, please uncomment the following two lines
% to display URLs in blue roman font according to Springer's eBook style:
%\usepackage{color}
%\renewcommand\UrlFont{\color{blue}\rmfamily}
\usepackage[pagebackref=true,breaklinks=true,colorlinks,bookmarks=false]{hyperref}
%
\begin{document}
%
\title{DLUNet: Semi-supervised Learning based Dual-Light UNet for Multi-organ Segmentation}
%
\titlerunning{DLUNet}
% If the paper title is too long for the running head, you can set
% an abbreviated paper title here
%
\author{Haoran Lai\inst{1} \and
Tao Wang\inst{2} \and
Shuoling Zhou\inst{3}}
\authorrunning{H. Lai et al.}
% First names are abbreviated in the running head.
% If there are more than two authors, 'et al.' is used.
%
\institute{Guangdong Provincial Key
Laboratory of Medical Image Processing, Southern Medical University,
Guangzhou, 510515, China \\ \email{hanranlai@163.com} \and
Guangdong Provincial Key
Laboratory of Medical Image Processing, Southern Medical University,
Guangzhou, 510515, China \\ \email{wangtao\_9802@sina.com} \and
Guangdong Provincial Key
Laboratory of Medical Image Processing, Southern Medical University,
Guangzhou, 510515, China \\ \email{zslandsouling@163.com}}

% \email{lncs@springer.com} \and
% \email{lncs@springer.com} \and
% \email{lncs@springer.com}}
% \and
% Springer Heidelberg, Tiergartenstr. 17, 69121 Heidelberg, Germany
% \email{lncs@springer.com}\\
% \url{http://www.springer.com/gp/computer-science/lncs} 
% \and
% ABC Institute, Rupert-Karls-University Heidelberg, Heidelberg, Germany\\
% \email{\{abc,lncs\}@uni-heidelberg.de}}
%
\maketitle              % typeset the header of the contribution
%
\begin{abstract}
    Manual annotation of abdominal multi-organ ground truth is labor-intensive. In order to make full use of CT data, we developed a semi-supervised learning based dual-light UNet. In the training phase, it consists of two light UNets, which make full use of labeled and unlabeled data simultaneously by using consistency-based learning. Moreover, separable convolution and residual connection were introduced into the light UNet to reduce the computational cost. Further, a robust segmentation loss was applied to improve the performance. In the inference phase, only one light UNet is used, which requires low time cost and less GPU memory utilization. The average DSC of this method on the validation set is 0.8718. The code is available at \url{https://github.com/laihaoran/Semi-Supervised-nnUNet}.
\keywords{Semi-supervised learning \and UNet \and Robust segmentation loss.}
\end{abstract}



\section{Introduction}

Fast automatic abdominal multi-organ segmentation can greatly improve the labeling speed of radiologists. However, there are still a series of challenges for automatic abdominal multi-organ segmentation: 1) Manual labeling of ground truth requires significant labor cost. 2) There is a large amount of unlabeled data that can be used to improve performance. 3) Medical image segmentation suffers from unclear boundaries. 4) Integrated automatic segmentation algorithms need to meet the requirements of low time cost and less GPU memory utilization.

Semi-supervised learning can be achieved by combining a small amount of labeled data and a large amount of unlabeled data, thus enabling training on small labeled datasets. The current major semi-supervised learning algorithms can be categorized into 1) pseudo-labeling-based learning~\cite{arazo2020pseudo,he2021re} and 2) consistency-based learning~\cite{Xiaokang2021cvpr,luo2020semi}. The foreground in abdominal multi-organ segmentation contains multiple categories with a dense distribution (multiple categories may exist in one region), which makes the task suitable for consistency-based learning.

Therefore, we propose a semi-supervised learning based dual-light UNet to achieve fast automatic abdominal multi-organ segmentation. First, a consistency learning strategy was introduced into the proposed network to effectively utilize the large amount of unlabeled data. Second, a light UNet was proposed to achieve efficient and fast automatic segmentation. Then, a robust segmentation loss function was applied to overcome the challenge of tiny foreground. Finally, the proposed method achieves fast and accurate automatic abdominal multi-organ segmentation.

The main contributions of this work are as follows.
\begin{itemize}
    \item[$\bullet$] We use a network consistency-based semi-supervised learning strategy to leverage large amounts of unlabeled data.
    
    \item[$\bullet$] We propose a light UNet for fast and efficient automatic abdominal multi-organ segmentation.
    
    \item[$\bullet$] We adopt a robust segmentation loss function to effectively overcome the challenge of tiny foreground.
    \end{itemize}

    \begin{figure}[htbp]
        \centering
        \includegraphics[scale=0.3]{imgs/ssl.png}
        \caption{Illustration of the architecture for consistency-based learning.}
        \label{fig:ssl}
        \end{figure}

\section{Method}
%###########################
\subsection{Consistency-based learning}


As shown in Figure~\ref{fig:ssl}, let $X_{l} = \{x_{li}, i\in N\}$ and $X_{u} = \{x_{ui}, i\in M\}$ be the labeled and unlabeled data, respectively, where $N$ and $M$ are the numbers of labeled and unlabeled samples, respectively. In our experiment, the condition $N \ll M$ holds for semi-supervised learning. First, two identical networks $f(\theta_{A})$ and $f(\theta_{B})$ are built with different parameter initialization methods. Then, $f(\theta_{A})$ and $f(\theta_{B})$ are each trained using the labeled data for abdominal organ segmentation.
\begin{equation}
    \begin{aligned}
	f(x_{li}; \theta_{A}) = p_{A,li}\\
    f(x_{li}; \theta_{B}) = p_{B,li}
    \end{aligned}
\end{equation}
where $p$ is the probability map. Next, the trained networks are used to obtain the probability maps of different unlabeled samples and their pseudo-labels.


\begin{equation}
    \begin{aligned}
        f(x_{ui}; \theta_{A}) = p_{A,ui}, f(x_{uj}; \theta_{A}) = p_{A,uj}\\
        f(x_{ui}; \theta_{B}) = p_{B,ui}, f(x_{uj}; \theta_{B}) = p_{B,uj}
    \end{aligned}
\end{equation}

\begin{equation}
    \begin{aligned}
        y_{A, ui} = \operatorname{arg\,max} (p_{A,ui}), y_{A, uj} = \operatorname{arg\,max}(p_{A,uj})\\
        y_{B, ui} = \operatorname{arg\,max} (p_{B,ui}), y_{B, uj} = \operatorname{arg\,max}(p_{B,uj})
    \end{aligned}
\end{equation}

\noindent CutMix operation~\cite{yun2019cutmix} is implemented on different unlabeled data and pseudo labels:

\begin{equation}
    \begin{aligned}
        x_{uij} = \mathbf{H} \odot  x_{ui}+ (1 - \mathbf{H}) \odot x_{uj}\\
        y_{A, uij} = \mathbf{H} \odot  y_{A, ui}+ (1 - \mathbf{H}) \odot y_{A, uj}\\
        y_{B, uij} = \mathbf{H} \odot  y_{B, ui}+ (1 - \mathbf{H}) \odot y_{B, uj}
    \end{aligned}
\end{equation}

In this situation, the outputs of the two networks can be used to supervise each other, which achieves network consistency-based learning.

\begin{equation}
    \begin{aligned}
        f(x_{uij}; \theta_{A}) = p_{A,uij} \longrightarrow y_{B, uij}\\
        f(x_{uij}; \theta_{B}) = p_{B,uij} \longrightarrow y_{A, uij}
    \end{aligned}
\end{equation}

During each iteration, the labeled data and the unlabeled data are simultaneously input to the networks for optimization.


\subsection{Light UNet}
To accelerate inference speed and reduce the GPU memory utilization, we modify the UNet in nnU-Net~\cite{isensee2021nnu}. The resulting light UNet is presented in Figure~\ref{fig:Network}.
\begin{itemize}
 \item  We replace the original convolution with depthwise separable convolution~\cite{chollet2017xception}, thus reducing the number of trainable parameters.
 \item  Residual connection~\cite{he2016deep} was introduced between all convolution layers, including encoder and decoder, thus improving the representational ability of the UNet.
\end{itemize}


\begin{figure}[htbp]
    \centering
    \includegraphics[scale=0.3]{imgs/UNet.jpg}
    \caption{The architecture of Light UNet.}
    \label{fig:Network}
    \end{figure}


\subsection{Robust segmentation Loss}
In the segmentation task, the commonly used segmentation loss is a combination of Dice loss and cross entropy (CE) loss, which has been proved to be robust in various medical image segmentation tasks~\cite{LossOdyssey}. In this paper, based on the previous segmentation loss, the idea of mean absolute error (MAE) loss was introduced into Dice and CE loss respectively. Therefore, a robust segmentation loss function $\mathcal{L}_{RS}$ was proposed, which consists of the noise-robust Dice loss $\mathcal{L}_{NRD}$ and the Taylor cross entropy loss $\mathcal{L}_{TCE}$.

\begin{equation}
    \mathcal{L}_{RS} =   \mathcal{L}_{NRD} + \mathcal{L}_{TCE}
\end{equation}

\begin{equation}
    \mathcal{L}_{NRD} =  \frac{\sum_{n = 1}^{DWH} \lvert \mu _{n} - \upsilon _{n}\rvert ^{\gamma }}
    {\sum_{n = 1}^{DWH} \mu_{n}^{2} + \sum_{n = 1}^{DWH} \upsilon_{n}^{2} + \epsilon }
\end{equation}

\begin{equation}
    \mathcal{L}_{TCE} =  \sum_{n = 1}^{DWH} (1 - \mu _{n,\upsilon=1}) + \frac{\sum_{n = 1}^{DWH} ( 1 - \mu _{n,\upsilon=1})^{2} }{2}
\end{equation}
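\noindent where $D$, $W$ and $H$ are the depth, width and height of the input, respectively, $\mu$ and $\upsilon$ are the voxels of the softmax output and the ground truth, respectively, $\gamma$ is the exponent hyper-parameter of the noise-robust Dice loss, and $\epsilon$ is a small constant that prevents division by zero.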

\subsection{Preprocessing and Inference}
The dataset was preprocessed with the nnU-Net configuration~\cite{isensee2021nnu}, including HU value clipping, HU value normalization, and resolution uniformity. In order to achieve category-balanced cropping for unlabeled data in the training stage, an nnU-Net model was trained in advance using a small amount of labeled data. Then, a pseudo-label is generated for each unlabeled sample; it is used only for category-balanced cropping and for no other purpose.


In the inference phase, a patch shift-based approach was used to generate mask outputs for the entire 3D CT. We used 0.5 shift steps for each patch to alleviate the misclassification of the results by local information. Moreover, all patches were flipped along three axes to generate robust performance.


\section{Experiments}
\subsection{Dataset and evaluation measures}
The FLARE2022 dataset is curated from more than 20 medical groups under the license permission, including MSD~\cite{simpson2019MSD}, KiTS~\cite{KiTS,KiTSDataset}, AbdomenCT-1K~\cite{AbdomenCT-1K}, and TCIA~\cite{clark2013TCIA}. The training set includes 50 labelled CT scans with pancreas disease and 2000 unlabelled CT scans with liver, kidney, spleen, or pancreas diseases. The validation set includes 50 CT scans with liver, kidney, spleen, or pancreas diseases.
The testing set includes 200 CT scans where 100 cases have liver, kidney, spleen, or pancreas diseases and the other 100 cases have uterine corpus endometrial, urothelial bladder, stomach, sarcomas, or ovarian diseases. All the CT scans only have image information and the center information is not available.

The evaluation measures consist of two accuracy measures: Dice Similarity Coefficient (DSC) and Normalized Surface Dice (NSD), and three running efficiency measures: running time, area under GPU memory-time curve, and area under CPU utilization-time curve. Only DSC score was presented in the experiments. All measures will be used to compute the ranking. Moreover, the GPU memory consumption has a 2 GB tolerance.




\subsection{Implementation details}
\subsubsection{Environment settings}
The development environments and requirements are presented in Table~\ref{table:env}.


\begin{table}[!htbp]
\caption{Development environments and requirements.}\label{table:env}
\centering
\begin{tabular}{ll}
\hline
Windows/Ubuntu version       & Ubuntu 18.04.5 LTS\\
\hline
CPU   & Intel(R) Xeon(R) Gold 5218 CPU @ 2.30GHz \\
\hline
RAM                         & 503 GB\\
\hline
GPU (number and type)                         & Two NVIDIA RTX 2080Ti 11G\\
\hline
CUDA version                  & 11.0\\                          \hline
Programming language                 & Python 3.7\\ 
\hline
Deep learning framework & Pytorch (Torch 1.11, torchvision 0.2.2) \\
\hline          
\end{tabular}
\end{table}


\subsubsection{Training protocols}
The training protocols are presented in Table~\ref{table:training}.



\begin{table*}[!htbp]
\caption{Training protocols.}
\label{table:training}
\begin{center}
% \resizebox{0.47\textwidth}{!}{
\begin{tabular}{ll} 
\hline
Network initialization         & ``He'' normal initialization\\
\hline
Batch size                    & 1 \\
\hline 
Patch size & 56$\times$160$\times$160  \\ 
\hline 
Target resolution & 2.5$\times$1.5$\times$1.5  \\ 
\hline
Total epochs & 1000 \\
\hline
Optimizer          & SGD with nesterov momentum ($\mu=0.99$)          \\ \hline
Initial learning rate (lr)  & 0.01 \\ \hline
Lr decay schedule & halved by 200 epochs \\
\hline
Training time                                           &  276 hours \\  \hline
Loss function                                           &  NRD + TCE \\  \hline
Number of model parameters    & 5.59M  \\ \hline
Number of flops & 33.81G  \\ \hline
%CO$_2$eq & NaN Kg\footnote{https://github.com/lfwa/%carbontracker/} \\  \hline
\end{tabular}

\end{center}
\end{table*}



\section{Results and discussion}
A public unlabeled validation set was used to evaluate the experimental results; the predictions can be uploaded to the online evaluation platform\footnote{\url{https://flare22.grand-challenge.org/evaluation/challenge/submissions/create/}} to obtain the metrics.


\subsection{Ablation of semi-supervised learning}
Table~\ref{table:AblationSSL} shows the effects of introducing semi-supervised learning into nnU-Net and the light UNet on the final segmentation performance. Two conclusions can be drawn from Table~\ref{table:AblationSSL}: (1) The segmentation performance of the light UNet is inferior to that of nnU-Net because it has fewer parameters, but the light UNet can speed up the inference and reduce the GPU memory utilization. (2) The introduction of semi-supervised learning greatly improves the segmentation performance of both networks. Further, the performance improvement is greater for the light UNet, which has fewer parameters than nnU-Net; this may be because a model with few parameters has more room for improvement.


\begin{table}[!htbp]
    \tiny
    \caption{Ablation of semi-supervised learning (SSL). LV, RK, SL, PC, AT, IVC, RAG, LAG, GB, EH, SM, DD, and LK are short for Liver, Right Kidney, Spleen, Pancreas, Aorta, Inferior Vena Cava, Right Adrenal Gland, Left Adrenal Gland, Gallbladder, Esophagus, Stomach, Duodenum, and Left Kidney, respectively.}
    \label{table:AblationSSL}
    \begin{center}
    % \resizebox{0.47\textwidth}{!}{
    \begin{tabular}{ccccccccccccccc} 
    \hline
    Method         & Mean & LV & RK& SL& PC& AT& IVC& RAG& LAG& GB& EH& SM& DD &LK\\
    \hline
    nnU-Net w/o SSL & 0.869 & 0.967 & 0.880 & 0.941 & 0.841 & 0.949 & 0.882 & 0.822 & 0.819 & 0.821 & 0.877& 0.885 & 0.748 &  0.871 \\
    % \hline 
 
    nnU-Net w SSL & \textbf{0.895} & 0.978 & 0.897 & 0.973 & 0.909 & 0.973 & 0.922 & 0.839 & 0.826 & 0.779 & 0.900 & 0.914 & 0.838 &  0.888 \\
    \hline 

    Light UNet w/o SSL & 0.837  & 0.965 & 0.869 & 0.932 & 0.830 & 0.945 & 0.860 & 0.766 & 0.731 & 0.731 & 0.837 & 0.858 & 0.717 &  0.843 \\
    % \hline

    Light UNet w SSL & \textbf{0.878} & 0.976 & 0.910 & 0.969 & 0.894 & 0.960 & 0.896 & 0.807 & 0.763 & 0.764 & 0.865 & 0.915 & 0.799 &  0.891 \\
    \hline
    \end{tabular}
    \end{center}
    \end{table}


    \begin{table}[!htbp]
        \tiny
        \caption{Comparison of loss function.}
        \label{table:AblationLoss}
        \begin{center}
        % \resizebox{0.47\textwidth}{!}{
        \begin{tabular}{ccccccccccccccc} 
        \hline
        Loss & Mean & LV & RK& SL& PC& AT& IVC& RAG& LAG& GB& EH& SM& DD &LK\\
        \hline
        Dice+CE & 0.869 & \textbf{0.972} & \textbf{0.915} & \textbf{0.954}& \textbf{0.861}& \textbf{0.958}& \textbf{0.884}& \textbf{0.823}& 0.814& 0.720& 0.867& \textbf{0.888}& \textbf{0.751}&\textbf{0.889}\\
    
        NRD+TCE & \textbf{0.870} & 0.967 & 0.880& 0.941& 0.841& 0.949& 0.882& 0.822& \textbf{0.819}& \textcolor{red}{\textbf{0.821}}& \textbf{0.877}& 0.885& 0.748 &0.871\\
        \hline
        \end{tabular}
        \end{center}
        \end{table}

\subsection{Comparison of loss function}
From Table~\ref{table:AblationLoss}, it can be seen that the robust segmentation loss is superior to the combination of Dice and CE loss in terms of overall performance. Moreover, although the robust segmentation loss is inferior to the combination of Dice and CE loss for most individual organs, it has a great advantage for the segmentation of the gallbladder. The gallbladder is a small segmentation target; therefore, we conclude that the robust segmentation loss has some advantages for small target regions.





\subsection{Segmentation efficiency results}
Considering the balance between segmentation performance and inference speed, we reduce the original 7 flips in nnU-Net to 3 flips (tta). Moreover, to prevent particularly large images from running out of memory during the inference process, we only keep the final generated labels and do not keep the intermediate network output (RAM). The results are presented in Table~\ref{table:AblationPost}.

We did not upload a Docker image to test computational efficiency. Instead, we evaluated the computational efficiency on our own platform. In the end, we achieved a test time of 0.67 hours on the 50 validation samples, with a maximum RAM usage of 18 GB and a GPU memory usage of 2045 MB.

\begin{table}[!htbp]
    \tiny
    \caption{Extra processing for the final result. IS(H) is short for inference speed, with hour as unit.}
    \label{table:AblationPost}
    \begin{center}
    % \resizebox{0.47\textwidth}{!}{
    \begin{tabular}{lccccccccccccccc} 
    \hline
    Method  & Mean  & IS(H) & LV & RK& SL& PC& AT& IVC& RAG& LAG& GB& EH& SM& DD &LK\\
    \hline
    DLUNet & 0.878 & ~ & 0.976 & 0.910 & 0.969 & 0.894 & 0.960 & 0.896 & 0.807 & 0.763 & 0.764 & 0.865 & 0.915 & 0.799 &  0.891\\
    DLUNet+tta & \textbf{0.884} & 2.00 & 0.977 & 0.910 & 0.972 & 0.899 & 0.962 & 0.901 & 0.816 & 0.762 & 0.801 & 0.873 & 0.917 & 0.800 &  0.895\\ 
    DLUNet+tta+RAM & 0.872 & \textbf{0.67} & 0.973 & 0.903 & 0.964 & 0.890 & 0.948 & 0.888 & 0.789 & 0.741 & 0.792 & 0.857 & 0.911 & 0.795 &  0.885 \\ 
    \hline
    \end{tabular}
    \end{center}
    \end{table}

    \begin{figure}[htbp]
        \centering
        \includegraphics[scale=0.3]{imgs/Vsidual.png}
        \caption{Qualitative results on easy (case 06 and 21) and hard (case 47 and 48) examples. First column is the image, second column is the ground truth, third column is the predicted results by Light U-Net without ssl, fourth column is the predicted results by DLUNet with ssl.}
        \label{fig:visual}
        \end{figure}
    

\subsection{Qualitative results}
Figure~\ref{fig:visual} presents some easy and hard examples from the validation set, and the quantitative results are given in Table~\ref{table:visual}. Comparing the easy cases (Case 06 and Case 21) with the hard cases (Case 47 and Case 48), we find that our proposed method does not work well for lesion-affected organs. For example, the liver cancer region is wrongly identified in Case 47 and Case 48, especially in Case 48. This may be because our proposed method uses a patch-based training strategy, which lacks global information.


\begin{table}[!htbp]
    \tiny
    \caption{The DSC scores of easy and hard examples.}
    \label{table:visual}
    \begin{center}
    % \resizebox{0.47\textwidth}{!}{
    \begin{tabular}{cccccccccccccccc} 
    \hline
    Example & Method & Mean & LV & RK& SL& PC& AT& IVC& RAG& LAG& GB& EH& SM& DD &LK\\
    \hline
    Case 06 & w/o ssl &0.915 & 0.983 & 0.974 & 0.978 & 0.924 & 0.965 & 0.944 & 0.899 & 0.894 & 1.000 & 0.908& 0.936 & 0.756 &  0.729 \\
     & w ssl &\textbf{0.924} & 0.985 & 0.983 & 0.983 & 0.929 & 0.977 & 0.955 & 0.927 & 0.920 & 1.000 & 0.922 & 0.940 & 0.760 &  0.725 \\
    \hline

    Case 21 &w/o ssl & 0.946 & 0.985 & 0.972 & 0.983 & 0.926 & 0.966 & 0.937 & 0.869 & 0.864 & 1.000 & 0.935 & 0.969 & 0.926 &  0.973 \\
     & w ssl &\textbf{0.957}& 0.988 & 0.980 & 0.989 & 0.932 & 0.980 & 0.946 & 0.894 & 0.897 & 1.000 & 0.949 & 0.973 & 0.936 &  0.981 \\
    \hline

    Case 47 & w/o ssl & 0.798 & 0.885 & 0.978 & 0.866 & 0.798 & 0.936 & \textbf{0.665} & \textbf{0.677} & 0.818 & \textbf{0.676} & 0.807& 0.904 & \textbf{0.395} &  0.977 \\
     & w ssl & \textbf{0.805} & 0.882 & 0.986 & 0.868 & 0.805 & 0.954 & \textbf{0.682} & \textbf{0.676} & 0.833 & \textbf{0.707} & 0.815& 0.918 & \textbf{0.358} &  0.983 \\
    \hline

    Case 48 & w/o ssl & 0.716 & 0.971 & 0.971 & 0.667 & 0.841 & 0.958 & \textbf{0.461} & \textbf{0.679} & 0.856 & \textbf{0.000} & 0.693& 0.598 & 0.796 &  0.811 \\
     & w ssl & \textbf{0.729} & 0.972 & 0.978 & 0.702 & 0.861 & 0.970 & \textbf{0.456} & \textbf{0.747} & 0.869 & \textbf{0.000} & 0.692& 0.623 & 0.795 &  0.812 \\

    \hline
    \end{tabular}
    \end{center}
    \end{table}



\subsection{The performance of testing set}

As shown in Table~\ref{table:Testing}, our method shows a competitive segmentation performance on the testing set. Moreover, we find that all metrics of case 97 are 0. This may be caused by the fact that the view of case 97 is flipped, which leads to the misjudgment of the inference optimization algorithm and terminates the inference in advance, resulting in not generating the correct segmentation output. Since the focus of our method is on segmentation performance improvement, the optimization of inference speed is neglected, resulting in the lack of advantage of our method in the final composite score.


\begin{table}[!htbp]
    \tiny
    \caption{The performance of testing set.}
    \label{table:Testing}
    \begin{center}
    % \resizebox{0.47\textwidth}{!}{
    \begin{tabular}{ccccccccccccccc} 
    \hline
    Metric & Mean & LV & RK& SL& PC& AT& IVC& RAG& LAG& GB& EH& SM& DD &LK\\
    \hline
    DSC & 0.881 & 0.968 & 0.941 & 0.949 & 0.854 & 0.949 & 0.900 & 0.815 & 0.805 & 0.809 & 0.805& 0.924 & 0.797 &  0.937 \\
    \hline
    NSD & 0.940 & 0.969 & 0.960 & 0.961 & 0.954 & 0.982 & 0.923 & 0.953 & 0.939 & 0.828 & 0.913& 0.951 & 0.926 &  0.958 \\
    \hline

    Time (s)& 73.92\\
    \hline
    AUC GPU & 138831\\
    \hline
    AUC CPU & 1195\\
    \hline

    \end{tabular}
    \end{center}
    \end{table}




\subsection{Limitation and future work}
In this paper, we do not use existing deep learning model packaging techniques (e.g., TensorRT) to package the model, reduce computational memory, and increase inference speed. Therefore, the implementation of the operation can be considered in the future work. 




\section{Conclusion}
The FLARE2022 competition aims to design an efficient and accurate abdominal multi-organ segmentation network by using a small amount of labeled data and a large amount of unlabeled data. In this paper, we proposed DLUNet for this task. First, consistency-based learning was introduced to achieve semi-supervised learning. Second, separable convolution and residual connection were used to greatly reduce the computational cost. Moreover, a robust segmentation loss was applied to improve segmentation performance. Experiments show that DLUNet achieves a certain balance in terms of model parameters, computation time, GPU memory utilization, and segmentation performance. The method is promising for the task.


\subsubsection{Acknowledgements} The authors of this paper declare that the segmentation method they implemented for participation in the FLARE 2022 challenge has not used any pre-trained models nor additional datasets other than those provided by the organizers. The proposed solution is fully automatic without any manual intervention.


%
% ---- Bibliography ----
%
% BibTeX users should specify bibliography style 'splncs04'.
% References will then be sorted and formatted in the correct style.
%
\bibliographystyle{splncs04}
\bibliography{ref}

\end{document}
