\documentclass{midl} % Include author names
%\documentclass[anon]{midl} % Anonymized submission

% The following packages will be automatically loaded:
% jmlr, amsmath, amssymb, natbib, graphicx, url, algorithm2e
% ifoddpage, relsize and probably more
% make sure they are installed with your latex distribution

\usepackage{mwe} % to get dummy images
\usepackage[skip=0pt]{caption}

\jmlryear{2020}
\jmlrworkshop{Full Paper -- MIDL 2020}

\title[Adversarial Domain Adaptation for Cell Segmentation]{Adversarial Domain Adaptation for \\Cell Segmentation}

 % Use \Name{Author Name} to specify the name.
 % If the surname contains spaces, enclose the surname
 % in braces, e.g. \Name{John {Smith Jones}} similarly
 % if the name has a "von" part, e.g \Name{Jane {de Winter}}.
 % If the first letter in the forenames is a diacritic
 % enclose the diacritic in braces, e.g. \Name{{\'E}louise Smith}

 % Two authors with the same address
 \midlauthor{\Name{Mohammad Minhazul Haq\nametag{$^{1}$}} \Email{mohammadminhazu.haq@mavs.uta.edu}\\
 \Name{Junzhou Huang\nametag{$^{1}$}} \Email{jzhuang@uta.edu}\\
 \addr $^{1}$ Department of Computer Science and Engineering, University of Texas at Arlington,\\ Arlington, TX 76019, USA}


 % Three or more authors with the same address:
 % \midlauthor{\Name{Author Name1} \Email{an1@sample.edu}\\
 %  \Name{Author Name2} \Email{an2@sample.edu}\\
 %  \Name{Author Name3} \Email{an3@sample.edu}\\
 %  \addr Address}


% Authors with different addresses:
% \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\\
% \addr Address 1
% \AND
% \Name{Author Name2} \Email{xyz@sample.edu}\\
% \addr Address 2
% }

%\footnotetext[1]{Contributed equally}

% More complicate cases, e.g. with dual affiliations and joint authorship
%\midlauthor{\Name{Author Name1\midljointauthortext{Contributed equally}\nametag{$^{1,2}$}} \Email{abc@sample.edu}\\
%\addr $^{1}$ Address 1 \\
%\addr $^{2}$ Address 2 \AND
%\Name{Author Name2\midlotherjointauthor\nametag{$^{1}$}} \Email{xyz@sample.edu}\\
%\Name{Author Name3\nametag{$^{2}$}} \Email{alphabeta@example.edu}\\
%\Name{Author Name4\midljointauthortext{Contributed equally}\nametag{$^{3}$}} \Email{uvw@foo.ac.uk}\\
%\addr $^{3}$ Address 3 \AND
%\Name{Author Name5\midlotherjointauthor\nametag{$^{4}$}} \Email{fgh@bar.com}\\
%\addr $^{4}$ Address 4
%}



\begin{document}

\maketitle

\begin{abstract}
To successfully train a cell segmentation network in a fully-supervised manner for a particular type of organ or cancer, we need a dataset with ground-truth annotations. However, the scarcity of such annotated datasets and the tedious labeling process force us to find a way to train with unlabeled datasets. In this paper, we propose a network named CellSegUDA for cell segmentation on the unlabeled dataset (target domain). It is achieved by applying an unsupervised domain adaptation (UDA) technique with the help of another labeled dataset (source domain) that may come from other organs or sources. We validate our proposed CellSegUDA on two public cell segmentation datasets and obtain significant improvement as compared with the baseline methods. Finally, considering the scenario when we have a small number of annotations available from the target domain, we extend our work to CellSegSSDA, a semi-supervised domain adaptation (SSDA) based approach. Our SSDA model also gives excellent results which are quite close to the fully-supervised upper bound in the target domain.
\end{abstract}

\begin{keywords}
Cell Segmentation, Unsupervised and Semi-supervised Domain Adaptation
\end{keywords}

\section{Introduction}

Convolutional Neural Network (CNN) based approaches like Fully Convolutional Network (FCN) \cite{fcn2014long}, U-Net \cite{unet2015ronneberger}, and UNet++ \cite{nestedUnet2018zhou} give very promising results in biomedical image segmentation tasks as well as in cell segmentation problems \cite{localitySensitive2016sirinukunwattana}. However, to successfully train these fully-supervised methods, we need at least a small amount of annotated data, i.e., images with their corresponding pixel-level ground-truth labels \cite{monuseg2017kumar,visCnn2014zeiler}. Unfortunately, such well-annotated datasets, even very small ones, are very rare in the biomedical domain. Moreover, collecting an unannotated dataset first and then labeling it manually with the help of experts is an expensive, time-consuming and tedious process \cite{largeScale2017xu,sifa2019chen}. What if we could train a deep CNN model for cell segmentation without any need for further annotations? Domain Adaptation, a subclass of Transfer Learning, provides a solution in such scenarios.

\begin{figure}[t]
\floatconts
  {fig:motivation}  
  {\caption{Images from different domains look dissimilar while their pixel-level segmentation outputs are similar. In this figure, source domain and target domain images come from Kidney Renal Clear cell carcinoma (KIRC) and Triple Negative Breast Cancer (TNBC) respectively.}}
  {\includegraphics[width=1\linewidth]{figure_1_haq20}}  
\end{figure}

A multi-level adversarial network based domain adaptation approach for semantic segmentation was proposed by \citet{adaptStructured2018tsai}. \citet{cyCaDA2017hoffman} proposed an unsupervised domain adaptation model utilizing both pixel-level and feature-level adaptation. \citet{pix2pix2017isola} applied conditional GAN \cite{condGan2014mehdi} for image-to-image translation problems. \citet{crDoCo2019chen} proposed a cross-domain consistency loss based pixel-wise adversarial domain adaptation algorithm. \citet{fcan2018zhang} proposed a fully convolutional adaptation network for semantic segmentation. For different types of biomedical image segmentation, several adversarial network based approaches have also been proposed. A multi-connected domain discriminator based UDA model for brain lesion segmentation was proposed by \citet{udaBrainLesion2016kamnitsas}. \citet{udaCardiothoracic2018dong} introduced another UDA framework for cardiothoracic ratio estimation through chest organ segmentation. \citet{multiOrgan2018mahmood} proposed a cell segmentation approach in which a large dataset is generated using synthesization. \citet{robustHistopathImageAnalysis2019hou} also synthesized annotated training data for histopathology image segmentation. \citet{advSynthLearning2018huo} proposed an end-to-end CycleGAN \cite{cyclegan2017zhu} based whole abdomen MRI to CT image synthesis and CT splenomegaly segmentation network.

In this paper, we consider the unannotated dataset, i.e.\ the one for which we want to predict the labels, as the target domain. Then, with the help of another related but different annotated dataset, referred to as the source domain, we apply an adversarial learning~\cite{gan2014goodfellow} based domain adaptation technique to the cell segmentation problem. Thus, our proposed framework learns from the labeled source domain and adapts to the unlabeled target domain. We observed that images from different cell datasets, even if collected from different organs or cancer types, exhibit dissimilarity although their corresponding segmentation ground-truth labels are quite similar (see \figureref{fig:motivation}). In summary, ground-truth labels for cell segmentation are domain-invariant.

In this work, we first propose an unsupervised domain adaptation model for cell segmentation. Because of our aforementioned observation, we apply our domain adaptation in the output space rather than in the feature space. With the help of adversarial learning, we train a robust biomedical image segmentation network to generate source-domain look-alike outputs for target images. Additionally, we use a decoder network to make target images and target predictions correlated to each other as much as possible. Finally, we extend our unsupervised domain adaptation technique to semi-supervised domain adaptation (SSDA) considering that we have some annotations available from the target domain.

Conducting extensive experiments on two cell segmentation datasets, we conclude that our proposed UDA method, CellSegUDA, outperforms both a fully-supervised model~\cite{unet2015ronneberger} trained on the source domain and evaluated on the target domain, and a baseline UDA model~\cite{udaCardiothoracic2018dong}. Experimental results (see Section 3) also show that the accuracy of our SSDA strategy is very close to the upper bound of a fully-supervised model trained in the target domain.

Thus, the main contributions of this paper are: \textbf{1)} We propose an adversarial learning based unsupervised domain adaptation (UDA) approach to solve cell segmentation problem for unannotated datasets. \textbf{2)} Our proposed method is simple as it does not depend on any data synthesization or data augmentation. \textbf{3)} Our proposed UDA framework can be easily extended to semi-supervised domain adaptation (SSDA) in the scenario where a small portion of the target domain is labeled. \textbf{4)} Extensive and comprehensive experiments on two datasets have demonstrated the superiority of the proposed methods.

\begin{figure}[t]
\floatconts
  {fig:architecture}  
  {\caption{Complete architecture of CellSegUDA. Segmentation network generates segmentation outputs, from which decoder reconstructs input images. Discriminator distinguishes between source domain outputs and target domain outputs.}}
  {\includegraphics[width=1\linewidth]{figure_2_haq20}}  
\end{figure}

\section{Methodology}
Formally, in our cell segmentation problem, we have cell histology patches as input $X$ of size $H \times W \times 3$. Then, we want to predict the segmentation output $\hat{Y}$ of size $H \times W \times 1$. Depending on the domain, we may also have pixel-wise ground-truth label $Y$ of size $H \times W \times 1$ which is basically a binary mask.

Then, in unsupervised domain adaptation problem, we have a source domain with $N_s$ annotated images $\{(X_s, Y_s)\}$, and a target domain which has $N_t$ unannotated images $\{(X_t)\}$. In the case of semi-supervised domain adaptation problem, we assume that our target domain consists of $N_t^l$ images with annotations $\{(X_t^l, Y_t)\}$, and $ N_t^u $ unannotated images $\{(X_t^u)\}$. Our ultimate goal is to learn a cell segmentation model that accurately produces the segmentation output in the target domain.

\subsection{CellSegUDA}
We refer to our cell segmentation unsupervised domain adaptation (UDA) model as CellSegUDA, which is shown in \figureref{fig:architecture}. CellSegUDA consists of three modules: Segmentation network (S), Decoder (R), and Discriminator (D).\\

\noindent \textbf{Segmentation network (S)} Our segmentation network S takes images $X$ as input and produces the segmentation prediction $\hat{Y}$ of the same size as the input, hence $\hat{Y} = S(X)$. This segmentation network can be thought of as the generator module of a GAN~\cite{gan2014goodfellow} framework.

We train S to generate the segmentation predictions $\hat{Y_s}$ similar to the ground-truth labels $Y_s$ in the source domain. We cannot compute any pixel-level loss for target predictions since ground-truth labels are not available for target images in UDA. In practice, we found dice-coefficient loss to be more effective than binary cross-entropy loss for cell segmentation tasks. Therefore, we choose dice-coefficient loss as our segmentation loss:
\begin{equation}
\label{eq:seg_loss_source}
L_{seg}(X_s) = 1 - \frac{2 \cdot Y_s^\prime \cdot \hat{Y_s^\prime}}{Y_s^\prime + \hat{Y_s^\prime}},
\end{equation}
where $Y_s^\prime$ and $\hat{Y_s^\prime}$ are the flattened $Y_s$ and $\hat{Y_s}$ respectively.

Training S with only the annotated source data teaches S to make accurate predictions for source images. However, this segmentation network will generate incorrect outputs for target images as there are visual discrepancies between source images and target images. Because of our observation that cell segmentation outputs are domain-invariant, we require S to produce target domain predictions that are as close as possible to the source domain predictions. In other words, we want to make the distribution of target predictions $\hat{Y_t}$ closer to that of source predictions $\hat{Y_s}$. Thus, we define the adversarial loss as:
\begin{equation}
L_{adv}(X_t) = - \frac{1}{H^\prime \times W^\prime} \sum_{h^\prime, w^\prime} \log\bigl(D(\hat{Y}_t)\bigr),
\end{equation}
where $\hat{Y}_t = S(X_t)$, and $H^\prime$ and $W^\prime$ are the height and width of the discriminator output $D(\hat{Y}_t)$. This adversarial loss helps S to fool the discriminator so that it considers $\hat{Y_t}$ as source domain segmentation outputs.

Segmentation loss and adversarial loss together guide S to generate target domain predictions $\hat{Y}_t$ which look similar to source domain ground-truths. However, it is highly probable that these target predictions are not well-correlated with the corresponding target input images. The ability to reconstruct images from the predictions with a visual appearance similar to the input images will ensure that there is a correlation between the input image and the segmentation output.\\

\noindent \textbf{Decoder (R)} To ensure that our target domain predictions spatially correspond to the target domain images, we use a decoder network R in CellSegUDA. In a similar way to \citet{wnet2017xia}, we consider our segmentation network S as an encoder. Then, decoder R reconstructs target images from the corresponding predictions. Thus, S and R together work as an autoencoder.

Using our decoder network R, we first reconstruct target input images $X_t$ from $\hat{Y}_t$. Then, we calculate the reconstruction loss as:
\begin{equation}
L_{recons}(X_t) =  \frac{1}{H \times W \times C} \sum_{h,w,c}{(X_t - R(\hat{Y}_t))}^2,
\end{equation}
where $R(\hat{Y}_t)$ is the output of the decoder for $\hat{Y}_t$, and $C$ is the number of channels of the input image $X$.

Thus, we minimize the following total loss while training our segmentation network:
\begin{equation}
\label{eq:total_loss_uda}
L_s(X_s, X_t) = L_{seg}(X_s) + \lambda_{adv} L_{adv}(X_t) + \lambda_{recons} L_{recons}(X_t),
\end{equation}
where, $\lambda_{adv}$ and $\lambda_{recons}$ are the weights to balance corresponding losses.\\

\noindent \textbf{Discriminator (D)} Since we want to generate similar predictions for both source images and target images, we incorporate a discriminator D in CellSegUDA. This discriminator takes a source domain prediction or a target domain prediction as input, and then distinguishes whether the input, i.e.\ the prediction, comes from the source domain or the target domain. To train D, we use the following cross-entropy loss:
\begin{equation}
L_{dis}(\hat{Y}) = - \frac{1}{H^\prime \times W^\prime} \sum_{h^\prime,w^\prime} \Bigl[ z \cdot \log{(D(\hat{Y}))} + (1-z) \cdot \log{(1 - D(\hat{Y}))} \Bigr],
\end{equation}
where $z=0$ when D takes a target domain prediction as its input, and $z=1$ when the input comes from a source domain prediction.

\subsection{CellSegSSDA}
In the semi-supervised domain adaptation (SSDA) problem, we must make the best use of the available target domain annotations $Y_t$ while training our segmentation network S. In such scenarios, we extend our CellSegUDA framework to CellSegSSDA, a cell segmentation semi-supervised domain adaptation model.

In CellSegSSDA, for unannotated target images we do the same as in CellSegUDA. However, when we encounter an annotated target sample $(X_t^l, Y_t)$ while training, we additionally compute the segmentation loss $L_{seg}(X_t^l)$ in a similar manner to \equationref{eq:seg_loss_source}. Then, while computing the total loss we incorporate $L_{seg}(X_t^l)$ so that the segmentation network learns to generate predictions closer to the target ground-truths. Therefore, \equationref{eq:total_loss_uda} is now modified as below:
\begin{equation}
L_s(X_s, X_t^l) = L_{seg}(X_s) + L_{seg}(X_t^l) + \lambda_{adv} L_{adv}(X_t^l) + \lambda_{recons} L_{recons}(X_t^l)
\end{equation}

\subsection{Implementations}
In our work, we use U-Net \cite{unet2015ronneberger} as both our segmentation network and decoder. We choose U-Net so that our proposed segmentation framework can be directly applied in other biomedical domains. We preferred U-Net over UNet++~\cite{nestedUnet2018zhou} because it has fewer parameters. Following DCGAN~\cite{discriminator2015radford}, we designed our discriminator consisting of five convolutional layers. To train CellSegUDA and CellSegSSDA, we followed the training strategy from GAN~\cite{gan2014goodfellow}. The Adam optimizer~\cite{adam2014kingma} is used with learning rates of 0.0001, 0.001 and 0.001 for the segmentation network, discriminator and decoder respectively. We empirically choose 0.001 and 0.01 as $\lambda_{adv}$ and $\lambda_{recons}$ respectively. We do not use any data augmentation in our experiments.

\section{Experiments}
\subsection{Datasets}
\noindent \textbf{Dataset-1 (KIRC)} This dataset is taken from \citet{crowdsourcing2015irshad} in which images are extracted at 40x magnification from whole slide images (WSI) of Kidney Renal Clear cell carcinoma (KIRC). This dataset, referred to as KIRC, consists of 486 H\&E stained histology images of $400 \times 400$ pixel size with annotations made by expert pathologists and research fellows. In our experiments, we randomly split KIRC into 80\% for training, 10\% for validation and 10\% for testing.

\noindent \textbf{Dataset-2 (TNBC)} \citet{deepRegression2018naylor} generated this dataset by collecting slides from Triple Negative Breast Cancer (TNBC) patients at 40x magnification. For a total of 50 H\&E stained histology images of pixel size $512 \times 512$, labeling was performed by expert pathologist and research fellows. We follow the same data splitting as KIRC for this dataset, which we refer to as TNBC.

\noindent \textbf{Visual differences among datasets} Although both datasets consist of H\&E stained histopathology images, they are collected from two different organs and different institutions. KIRC images are collected from TCGA portal (image acquiring tools are unknown to us), whereas TNBC images were acquired at Curie Institute using Philips Ultra Fast Scanner 1.6RA. Organ difference, institutional difference, and using different imaging tools and protocols cause the visual difference among the images from these two datasets. See \figureref{fig:motivation}, where TNBC image looks dimmer than KIRC image.

\subsection{Experimental results}
\textbf{Experiment-1 (KIRC $\rightarrow$ TNBC)} In our first experiment, we choose KIRC as source domain and TNBC as target domain, denoted by KIRC $\rightarrow$ TNBC. We start with our unsupervised domain adaptation (UDA) model CellSegUDA which gives much better accuracies than a UDA baseline DA-ADV \cite{udaCardiothoracic2018dong}. We also choose a fully-supervised model U-Net \cite{unet2015ronneberger} to get an idea of how it performs when directly applying transfer learning, i.e.\ training with only KIRC and then testing it on TNBC without any modifications, which is also considered the lower-bound of experimental performance. This poor performance of transfer learning (see the first row of \tableref{tab:experimental_result}) happens because of the visual domain gap between source training images and target test images, also known as the domain shift problem. \figureref{fig:visualization_1}(c) shows the visualization result of applying transfer learning in which many of the cells are missed when compared to the ground-truth. Then, training U-Net with TNBC-train and testing it on TNBC-test gives us the upper-bound (last row of \tableref{tab:experimental_result}). \tableref{tab:experimental_result} shows that CellSegUDA gives 6.36 higher IoU\% than the source-trained U-Net model. We see that CellSegUDA also has 4.09 higher IoU\% than the UDA baseline DA-ADV. We check the effect of our decoder network R by training CellSegUDA without reconstruction loss, denoted as CellSegUDA w/o recons in \tableref{tab:experimental_result}. We find that the reconstruction loss really makes our segmentation network more accurate (see \figureref{fig:visualization_1}(e)-(f) for visualization). \figureref{fig:visualization_1}(g) also shows that we can reconstruct input images using our decoder from the corresponding segmentation prediction, thus we believe that our prediction is well-correlated with its input.

\begin{table}[t]
 % The first argument is the label.
 % The caption goes in the second argument, and the table contents
 % go in the third argument.
\floatconts
  {tab:experimental_result}%
  {\caption{Segmentation results for Experiment-1 and Experiment-2. IoU denotes intersection over union. Here, unsupervised domain adaptation (UDA) baseline is denoted as DA-ADV. CellSegUDA w/o recons, CellSegUDA and CellSegSSDA refer to our proposed UDA model without reconstruction loss, proposed UDA with reconstruction loss, and proposed semi-supervised domain adaptation method respectively. CellSegSSDA(source 100\% + target n\%) denotes n\% annotations available in TNBC-train and KIRC-train for experiment-1 and experiment-2 respectively. Results are from testing on TNBC-test and KIRC-test for experiment-1 and experiment-2 respectively.}}%
  {\begin{tabular}{ l|c|c|c|c| }
	    \cline{2-5}
        & \multicolumn{2}{|c|}{\textbf{Experiment-1}} & \multicolumn{2}{|c|}{\textbf{Experiment-2}}\\
        & \multicolumn{2}{|c|}{KIRC $\rightarrow$ TNBC} & \multicolumn{2}{|c|}{TNBC $\rightarrow$ KIRC}\\
		\cline{1-5}
        \multicolumn{1}{|l|}{\textbf{Method}} & \textbf{IoU\%} & \textbf{Dice score} & \textbf{IoU\%} & \textbf{Dice score}\\
		\hline
		\multicolumn{1}{|l|}{U-Net (source-trained)~\cite{unet2015ronneberger}} & 52.66 & 0.6875 & 54.82 & 0.7056 \\
		\hline
		\multicolumn{1}{|l|}{DA-ADV~\cite{udaCardiothoracic2018dong}} & 54.93 & 0.7079 & 55.43 & 0.7107 \\
		\hline
		\multicolumn{1}{|l|}{CellSegUDA w/o recons} & 56.56 & 0.72 & 56.91 & 0.7224 \\
		\hline
		\multicolumn{1}{|l|}{CellSegUDA} & 59.02 & 0.7394 & 57.09 & 0.7242 \\
		\hline
		\multicolumn{1}{|l|}{U-Net (source 100\% + target 10\%)} & 60.74 & 0.7534 & 56.89 & 0.7194 \\
		\hline
		\multicolumn{1}{|l|}{CellSegSSDA (source 100\% + target 10\%)} & 60.96 & 0.7557 & 58.81 & 0.7377 \\
		\hline
		\multicolumn{1}{|l|}{U-Net (source 100\% + target 25\%)} & 61.67 & 0.7607 & 59.32 & 0.7405 \\
		\hline
		\multicolumn{1}{|l|}{CellSegSSDA (source 100\% + target 25\%)} & 62.94 & 0.771 & 59.73 & 0.7443 \\
		\hline
		\multicolumn{1}{|l|}{U-Net (source 100\% + target 50\%)} & 56.73 & 0.7208 & 59.95 & 0.7464 \\
		\hline
		\multicolumn{1}{|l|}{CellSegSSDA (source 100\% + target 50\%)} & 63.59 & 0.7748 & 60.32 & 0.7494 \\
		\hline
		\multicolumn{1}{|l|}{U-Net (source 100\% + target 75\%)} & 59.06 & 0.7394 & 61.63 & 0.7592 \\
		\hline
		\multicolumn{1}{|l|}{CellSegSSDA (source 100\% + target 75\%)} & 64.96 & 0.7862 & 61.01 & 0.7541 \\
		\hline
		\multicolumn{1}{|l|}{U-Net (target-trained)} & 66.57 & 0.7985 & 62.04 & 0.7621 \\
		\hline
	\end{tabular}}
\end{table}

\begin{figure}[t]
\floatconts
  {fig:visualization_1}
  {\caption{Visualization of segmentation for KIRC$\rightarrow$TNBC. (g) shows that reconstructed target image (output from decoder) is quite similar to the input image which proves the efficacy of our proposed network. In (e)-(f) and (h)-(i), blue arrows indicate some missing cells of previous method. In (h) and (i), yellow arrows indicate false positives which are removed by following CellSegSSDA(50\%) and CellSegSSDA(75\%) respectively. Figure shows that CellSegSSDA can identify more cells as the percentage of available annotations increases. This average-dense cell histopathology image in (a) is chosen so that the reader can easily find out the visual differences without further zooming-in.}}
  {\includegraphics[width=1\linewidth]{figure_3_haq20}} 
\end{figure}

Then, we assess our semi-supervised domain adaptation method CellSegSSDA for KIRC $\rightarrow$ TNBC. Source dataset, KIRC, is the same as in the UDA experiments. However, now we treat TNBC as partially labeled. We train CellSegSSDA considering that 10\%, 25\%, 50\% and 75\% of the images from the TNBC-train dataset have annotations available. Then, testing on TNBC-test gives us increasing IoUs and dice scores. This happens because more true positive cells can be identified and some false positive cells can be removed by CellSegSSDA as we train it with more target annotations (see \figureref{fig:visualization_1}(h)-(j)). We observe that the accuracy of CellSegSSDA approaches the upper-bound (only lower by 1.61 IoU\%) as we train with more annotations from the target domain. We also compare CellSegSSDA with the fully-supervised model U-Net to demonstrate the superiority of our SSDA model. This time, to train U-Net, we combine the full KIRC dataset with the same 10\%, 25\%, 50\% and 75\% of TNBC-train we chose to train CellSegSSDA. As domain adaptation helps to reduce the domain shift problem, we see that CellSegSSDA outperforms the fully-supervised model in all of the cases.\\

\noindent \textbf{Experiment-2 (TNBC $\rightarrow$ KIRC)} We conduct another experiment in a similar way to Experiment-1 by selecting TNBC as source and KIRC as target domain. This experiment also reflects the excellence of CellSegUDA and CellSegSSDA compared to other approaches in terms of segmentation accuracies (see last two columns of \tableref{tab:experimental_result}). Similar to Experiment-1, we also see that segmentation accuracies of CellSegSSDA increase as more target images are annotated. Segmentation visualization from this experiment is shown in \figureref{fig:visualization_2}. From this experiment, we once again observe that CellSegUDA performs better than CellSegUDA w/o recons which proves the validity of our decoder and the effectiveness of reconstruction loss (see reconstructed image in \figureref{fig:visualization_2}(g)).

\section{Conclusion}
In this work, utilizing adversarial learning, we propose a novel unsupervised domain adaptation (UDA) framework for segmenting cells in unannotated datasets. Prominent experimental results validate the effectiveness of our UDA model. Finally, assuming we have a few annotations available, we extend our work to semi-supervised domain adaptation (SSDA). To make our UDA model more accurate, we are planning to generate and utilize pseudo ground-truth masks for the target domain in the future. We expect our proposed UDA and SSDA approaches to be very useful in other biomedical image segmentation tasks.

\begin{figure}
\floatconts
  {fig:visualization_2}
  {\caption{Visualization of segmentation for TNBC$\rightarrow$KIRC. In (f) and (j), blue arrows indicate missing cells of previous method. In (f) and (h)-(i), yellow arrows indicate a false positive which is removed by following method. Similar to \figureref{fig:visualization_1}, we chose this average-dense cell histopathology image for readability purposes.}}
  {\includegraphics[width=1\linewidth]{figure_4_haq20}}
\end{figure}

% Acknowledgments---Will not appear in anonymized version
\midlacknowledgments{This work was partially supported by US National Science Foundation IIS-1718853, the CAREER grant IIS-1553687 and Cancer Prevention and Research Institute of Texas (CPRIT) award (RP190107).}

\bibliography{haq20}

\end{document}
