% This is samplepaper.tex, a sample chapter demonstrating the
% LLNCS macro package for Springer Computer Science proceedings;
% Version 2.21 of 2022/01/12
%
\documentclass[runningheads]{llncs}
%
\usepackage[T1]{fontenc}
\usepackage{multirow}
\usepackage{makecell}
% T1 fonts will be used to generate the final print and online PDFs,
% so please use T1 fonts in your manuscript whenever possible.
% Other font encodings may result in incorrect characters.
%
\usepackage{graphicx}


% Used for displaying a sample figure. If possible, figure files should
% be included in EPS format.
%
% If you use the hyperref package, please uncomment the following two lines
% to display URLs in blue roman font according to Springer's eBook style:
% \usepackage{color}
%\renewcommand\UrlFont{\color{blue}\rmfamily}
% \urlstyle{rm}
%
\begin{document}
%
\title{3D Dental Arch Curve Detection from CBCT Images and Its Applications to Tooth Segmentation}
\titlerunning{3D Dental Arch Curve Detection}


\author{Benxiang Jiang\inst{1,2}\orcidID{0000-0001-5135-7630} \and
	Songze Zhang\inst{1,2}\orcidID{0000-0003-4548-4363} \and
	Jingyi Lyu\inst{1,2}\orcidID{0009-0005-4822-8877} \and
	Hongjian Shi*\inst{1,2}\orcidID{0000-0001-8732-4101}}
%
\authorrunning{Jiang et al.}
% First names are abbreviated in the running head.
% If there are more than two authors, 'et al.' is used.
%
\institute{Beijing Normal-Hong Kong Baptist University, Zhuhai, China \and 
Hong Kong Baptist University, Hong Kong, China\\
\email{shihj@uic.edu.cn}}

\maketitle  % Typeset the title block (must stay before the abstract)

\begin{abstract}
The three-dimensional (3D) dental arch curve, representing the spatial trajectory of dentition in either the maxilla or mandible, exhibits systematic alignment of tightly and orderly arranged teeth along its path. This structural configuration underscores its critical role as comprehensive anatomical guidance in digital dentistry, enabling high-precision tooth segmentation. In this study, we present a novel method for 3D dental arch curve detection from the volumetric cone beam computed tomography (CBCT) image, which, to our knowledge, represents the first successful implementation of 3D dental arch curve detection from the volumetric data. Specifically, we: (1) formulate and validate a dental arch curve fitting function, (2) identify 3D uniformly distributed feature points proximal to the true dental arch curve through a feature point network framework, and (3) optimize model parameters of the fitting function through a modified Expectation-Maximization (EM) algorithm with gradient descent. The proposed detection is then used to guide tooth segmentation through the curvilinear volume parameterization that unwinds the vicinity of the dental arch curve. Experimental results demonstrate the accuracy of 3D dental arch curve detection and performance enhancements in the downstream task of tooth segmentation, improving segmentation precision compared to conventional approaches.

\keywords{CBCT  \and 3D Dental Arch Curve \and Tooth Segmentation \and EM Algorithm \and Digital Dentistry.}
\end{abstract}
%
%
%
\section{Introduction}
The dental arch constitutes the curved arrangement of teeth within the maxilla or mandible, with its morphology typically characterized through parametric curve representations \cite{1,2,3}. Along this critical anatomical feature, teeth exhibit precise spatial organization and are systematically and tightly aligned. For volumetric data processing, this anatomical feature enables the extraction of dentition region-of-interest (ROI) since the dental arch curve's vicinity works as a filter to preserve diagnostically relevant dentition regions as illustrated in Fig. 1.

The dental arch in a volumetric data set is three-dimensional (3D) and preserves authentic spatial inter-tooth relationships. However, current research reveals an absence of robust algorithms for the detection of the 3D dental arch curve. Existing algorithms have succeeded in detecting dental arch curves with two-dimensional (2D) cone beam computed tomography (CBCT) projections \cite{3,4,5} or 3D dental mesh surfaces \cite{6,7,8} through arch point detection and subsequent curve interpolation. In 3D volumetric space, on the other hand, the critical challenge lies in reliably detecting arch points within the 3D CBCT image. This detection challenge hinders progress in detecting the true 3D dental arch from the 3D CBCT image.

A specific curve can be described either by interpolation \cite{9} or fitting \cite{10} from given points. Interpolation defines the curve by passing through all given points and so requires highly accurate and reliable point detection. Fitting, on the other hand, utilizes given points to estimate parameters of a function. The function with estimated parameters fits a curve. In 3D dental arch curve detection from the volumetric data, detecting feature points uniformly distributed around the true 3D dental arch is practicable. Thus, fitting presents a more sensible strategy for 3D dental arch curve detection. Fitting-based 3D dental arch curve detection involves three main challenges: 1. Formulation of a fitting function for the dental arch curve that suits the dental arch arrangement; 2. Automated detection of uniformly distributed feature points along the dental arch trajectory; and 3. Robust parameter estimation with latent variables that connect the feature points and the fitting function.

To resolve these challenges, this study proposes a three-stage fitting-based method for 3D dental arch curve detection in the 3D CBCT image as shown in Fig. 1. The method comprises: 1. A parametric curve equation to fit the dental arch curve; 2. A feature point network framework to identify uniformly distributed feature points proximal to the true dental arch curve; 3. A modified Expectation-Maximization (EM) algorithm \cite{11} with the gradient descent \cite{12} to optimize parameters and latent variables. 

The clinical applications of 3D dental arch curves are primarily in guiding tooth segmentation, the task that segments and numbers individual teeth within the 3D CBCT image. Therefore, we also propose a curvilinear volume parameterization method based on the 3D dental arch curve in this study, as illustrated in Fig. 1. Through this parameterization, the dentition region within the CBCT image can be transformed into two curvilinear volumes as two narrow cuboid volumes specifically designed to localize the maxillary and mandibular dentitions, respectively. Within each curvilinear volume, all maxillary or mandibular teeth are closely and orderly arranged from left to right and constitute the dominant region of the space. In contrast, within the original CBCT image, teeth exhibit an arch-shaped arrangement, and the dentition occupies only a minor portion of the overall volume. Consequently, compared to performing segmentation directly within the CBCT space, our proposed curvilinear volume parameterization method, based on the 3D dental arch curve, serves as an effective plug-and-play tool to enhance the accuracy of existing tooth segmentation methods.
To validate the efficacy of the curvilinear volume parameterization method based on the 3D dental arch curve, we conducted comprehensive tests using several baseline segmentation methods, including nnU-Net 2D \cite{21}, nnU-Net 3D \cite{20}, SegResNet \cite{25}, and MedNext \cite{26}. The experimental results demonstrate that curvilinear volume parameterization, functioning as a plug-and-play tool, effectively improves tooth segmentation accuracy.

\begin{figure}
\vspace{-0.4cm}
  \centering
	\includegraphics[totalheight=2.3in]{fig1.pdf}
	\caption{Overview of the proposed method for fitting 3D dental arch curves, and serving as a plug-and-play tool for segmenting individual teeth from a 3D CBCT image. a. The input 3D CBCT image. b. Proposed 3D dental arch curve detection. c. Curvilinear volume parameterization to transform the CBCT image into two narrow cuboid volumes where teeth are closely and orderly arranged from left to right. d. Tooth segmentation implementation in the curvilinear volumes. e. Curvilinear volume parameterization to transform the segmented teeth into the CBCT image.}
\vspace{-1cm}
\end{figure}

\section{Methods}

\subsection{Dental Arch Curve Fitting Function}
Contemporary orthodontic research emphasizes that any plan of dental arch determination must be flexible enough to produce arches varying in form through a parabola, cubic parabola, etc. \cite{2}. Therefore, our 3D dental arch curve fitting function is a parametric curve that combines two cubic parabolas and a quadratic parabola to capture both anatomical curvature and alveolar bone orientation:
\begin{equation}
\vec{C}(u) = \left( x(u), y(u), z(u) \right) = \left( 
\begin{array}{c} 
	\theta_1 u + \theta_2 u^2 + \theta_3 u^3 + \theta_4 \\ 
	\theta_5 u + \theta_6 u^2 + \theta_7 u^3 + \theta_8 \\ 
	\theta_9 u^2 + \theta_{10} u + \theta_{11} 
\end{array} 
\right) 
\end{equation}
where $u\in[0,1]$ parameterizes the dental arch trajectory in the DICOM coordinate system (x-axis: Left to Right, y-axis: Anterior to Posterior, z-axis: Inferior to Superior) \cite{17} and $\{\theta_1,\dots,\theta_{11}\}$ are unobserved parameters for curve fitting.
The parametric curve in Equation (1) achieves both anatomical fidelity and computational efficiency. The cubic parabola terms describe the natural variations and smooth transitions of the arch-shaped structure of the dental arch curve. The parabola term approximates the orientation of the alveolar bone. The 11 parameters in Equation (1) balance the complexity of the fitting function and the optimization feasibility. The three polynomial expressions in Equation (1) enable derivatives for parameter estimation.

\subsection{Feature Point Network Framework}
Our feature point network framework processes a 3D CBCT image to detect uniformly distributed feature points along the maxillary and mandibular dental arch trajectories, as illustrated in Fig. 1. The critical component of the framework is ground truth generation. After collecting ground truths, we employ a 3D residual encoder U-Net \cite{19,20} implemented within the nnU-Net framework \cite{21}. The nnU-Net framework automatically configures hyperparameters verified in segmentation tasks \cite{20,22}. This approach transforms the feature point detection task into a simpler binary volume segmentation problem. All segmented foreground voxels within the network output can subsequently be utilized as feature points for dental arch curve detection.

We propose an algorithm to generate ground truth feature points from manual tooth segmentation masks \cite{13,15}, addressing the labor-intensive challenges of manual feature point annotation along 3D dental arches. The procedure initiates by fitting a parabolic curve to the axial projection of tooth centroids:
\begin{equation}
	\xi(x) = \beta_1 x + \beta_2 x^2 + \beta_3
\end{equation}
where parameters $\beta_1,\beta_2,\beta_3$ are optimized through least squares estimation \cite{23} from the axial coordinates of all maxillary/mandibular tooth voxels. To ensure uniform feature point distribution, the parabola in Equation (2) undergoes uniform discrete sampling by $x_n = t((n-0.5)d),\ n\in \{1,\dots,N\}$, where $t(\cdot)$ represents the inverse function of the arc length function of the parabola, $d$ is the interval, and $N$ specifies the feature point count. At each discrete point $x_n$, the orthogonal plane perpendicular to the tangent vector of $x_n$ is computed as $x+(\beta_1+2\beta_2 x_n )y-x_n-(\beta_1+2\beta_2 x_n )\xi(x_n )=0$. Feature points are defined as centroids of the intersection areas between these planes and the maxillary/mandibular tooth volumes. These centroids are encoded in 3D label maps with label 1 for maxillary feature points and label 2 for mandibular feature points and processed with $5\times5\times5$ morphological dilation to create network training targets. This automated pipeline ensures anatomical accuracy while eliminating manual annotation inconsistencies.

\subsection{Modified EM algorithm with Gradient Descent}
The EM algorithm is an iterative statistical estimation method, particularly effective for parameter optimization with latent variables \cite{11}. Its robustness in handling latent variables makes it particularly suitable for 3D curve fitting challenges. The parameter estimation for Equation (1) employs a modified Expectation-Maximization (EM) framework that integrates gradient descent optimization \cite{12} to address latent variable challenges in 3D curve fitting. This hybrid approach combines the statistical rigor of EM with numerical optimization capabilities.

The initialization step begins with ordered feature point coordinates $\{\vec{P}_1,\dots,$ $\vec{P}_N\} = \{(x_1,y_1,z_1),\dots,(x_N,y_N,z_N)\}$ sorted by ascending $x$-values. Each feature point associates with a latent parameter $u_i$ for $i \in \{1,\dots,N\}$, initialized through centripetal parameterization \cite{24}: $u_i = u_{i-1} + \frac{\|\vec{P}_i - \vec{P}_{i-1}\|^{1/2}_2}{\sum_{j=2}^N \|\vec{P}_j - \vec{P}_{j-1}\|^{1/2}_2}$, with $u_1 = 0$. The error function quantifies cumulative deviation by $E = \sum_{i=1}^N \|\vec{P}_i - \vec{C}(u_i)\|^2_2$. In the maximization step, the partial derivative $\frac{\partial E}{\partial \theta_x} = 0$ gives the update for $\theta_x = (\theta_1,\theta_2,\theta_3,\theta_4)$, with analogous updates for $\theta_y = (\theta_5,\theta_6,\theta_7,\theta_8)$ and $\theta_z = (\theta_9,\theta_{10},\theta_{11})$. In the Expectation step, the latent variables $u_1,\dots,u_N$ are optimized via gradient descent with learning rate $\eta$: $u_i^{(k+1)} = u_i^{(k)} - \eta \frac{\partial E}{\partial u_i}$, $i=1,\dots,N$ where superscript $k$ denotes iteration index. $\frac{\partial E}{\partial u_1},\dots,\frac{\partial E}{\partial u_N}$ are computed through chain rule differentiation of the error function. In the iteration step, iteration alternates between coefficient updates and latent variable optimization until convergence or fixed iteration numbers. This dual optimization strategy combines the global convergence properties of EM with local refinement through gradient descent, thus balancing efficiency and accuracy.

\subsection{Curvilinear Volume Parameterization}
Given a fitted dental arch curve $\vec{C}_{{fit}}(u)$, we define tubular coordinates as $\{(x,y,$
$z) \mid (x,y,z) = \vec{C}_{{fit}}(u) + \alpha\vec{B}(u) + \gamma\vec{N}(u), u \in [0,1], \alpha \in [-40,40], \gamma \in [t_1,t_2]\}$, where $\vec{T}(u) = \frac{\vec{C}_{{fit}}'(u)}{|\vec{C}_{{fit}}'(u)|}$, $\vec{N}(u) = \frac{\vec{T}'(u)}{|\vec{T}'(u)|}$, and $\vec{B}(u) = \vec{T}(u) \times \vec{N}(u)$ are the unit tangent, normal, and binormal vectors, $[t_1,t_2] = [-40,56]$ for the maxillary teeth and $[-56,40]$ for the mandibular teeth. Let the length of $\vec{C}_{{fit}}(u)$ with $u \in [0,1]$ be $L$. These tubular coordinates unwind the vicinity of the dental arch curve $\vec{C}_{{fit}}(u)$ into a rectilinear 3D volume $V \in \mathcal{R}^{L\times80\times96}$ through discretely sampling $R_v$ at $\Delta u = 1/L$, $\Delta\alpha = \Delta\gamma = 1$ using bicubic interpolation and $(u,\alpha,\gamma) \leftarrow (x,y,z)$ via diffeomorphic mapping. This unwinding process is naturally reversible.

\section{Experiments and Discussions}

\subsection{Materials}

This study utilizes a hybrid dataset of 110 3D CBCT images with corresponding voxel-level tooth segmentation ground truth volumes, comprising 98 cases from \cite{13,14} and 12 cases from \cite{15}. The dataset \cite{13,14} contains 4531 CBCT volumes, of which 148 are publicly available. Among these 148 volumes, 50 are small field-of-view (FOV) CBCT images lacking complete maxillary and mandibular structures, while the remaining 98 large FOV CBCT volumes constitute our utilized subset. The dataset \cite{15} comprises 12 CBCT volumes, all of which were employed in this study. The hybrid dataset encompasses 15 distinct acquisition protocols with spatial resolutions ranging from $0.25\times0.25\times0.27$~mm\textsuperscript{3} to $0.4\times0.4\times0.4$~mm\textsuperscript{3} and field-of-view dimensions spanning $12.1\times12.1\times8.51$~cm\textsuperscript{3} to $16\times16\times13.1$~cm\textsuperscript{3}. To address the absence of manual tooth numbering, we implemented the FDI World Dental Federation notation system \cite{16} as illustrated in Fig. 1 through manual labeling, creating a classification strategy comprising 33 distinct anatomical categories: 32 permanent tooth identifiers (combining 4 jaw quadrants and 8 tooth types) plus background.

\subsection{Experimental Setup} 
Experiments were performed on a GIGABYTE G292-Z42 workstation featuring an Intel Xeon Platinum 8352V processor, NVIDIA RTX 4090 GPU, NVIDIA L20 GPU, and 64GB DDR4 memory, operating under Ubuntu 22.04 LTS. From the complete dataset of 110 CBCT scans with voxel-level annotations, we employed stratified sampling to construct training (88 cases) and testing (22 cases) cohorts while preserving anatomical diversity and scanner manufacturer balance. The training set comprised 79 scans from \cite{13,14} and 9 cases from \cite{15}, while the test set included 19 scans from \cite{13,14} and 3 from \cite{15}. This partitioning strategy ensured representative coverage of both conventional and challenging dental arch morphologies across different imaging protocols.

\vspace{-0.41cm}

\subsection{Feature Point Detection Performance}
Since the detected feature points reside within the CBCT volumetric space and are represented as small cubic regions, feature point detection accuracy was quantified through the Dice Similarity Coefficient (DSC) \cite{27}, defined as $DSC = \frac{2|P \cap G|}{|P| + |G|}$, where $P$ and $G$ denote predicted and ground truth feature point regions. The range of DSC is [0,1], with a larger value indicating better prediction accuracy. As shown in Fig. 2(a), our feature point network achieves mean DSC scores of $85.39 \pm 3.81\%$ (maxillary feature points, Class 1) and $83.9 \pm 3.6\%$ (mandibular feature points, Class 2), demonstrating its localization accuracy. Notably, case 5 (DSC$=74.43\%$ for Class 1) and case 9 (DSC$=72.39\%$ for Class 2) presented unique challenges: case 5 exhibited metal artifacts in the maxillary region with partial dentition loss, while case 9 contained two impacted mandibular wisdom teeth with associated positional anomalies.

Visual analysis of these challenging cases as shown in Figs. 2(b)-(c) revealed three main characteristics: true positive regions (blue regions) consistently captured essential dental arch trajectory features despite anatomical complexities; false negative regions (red regions) predominantly occurred in interproximal regions where feature point ambiguity naturally exists; and false positive regions (green regions) localized to regions excluded from natural dental arch trajectory, specifically metal artifacts in case 5 and impacted mandibular wisdom teeth in case 9. These strategic error distribution patterns in Figs. 2(b)-(c) indicate that the feature point network learned to prioritize anatomically meaningful feature points.

\subsection{Dental Arch Curve Fitting Analysis}
The convergence characteristics of our modified EM algorithm are demonstrated through progressive curve fitting outcomes across multiple iterations as shown in Fig. 2(d). Employing 1,000 gradient descent steps with a conservative learning rate $\eta = 1 \times 10^{-6}$ per EM iteration, the method achieves acceptable accuracy within just one iteration cycle. While increased iterations (10--50) further refine the fit, diminishing returns become evident, as evidenced by near-identical 10- and 50-iteration fitting function curves in Fig. 2(d). This rapid convergence stems from the algorithm's hybrid optimization strategy that synergizes partial derivative parameter solutions with gradient descent-based latent variable updates. Computational efficiency analysis reveals linear time scaling relative to iteration count, with single-iteration processing requiring $0.394 \pm 0.047$ seconds for maxilla and $0.367 \pm 0.052$ seconds for mandible, and 10 iterations requiring $3.664 \pm 0.414$ seconds for maxilla and $3.643 \pm 0.549$ seconds for mandible. The network's ability to maintain feature points' anatomical plausibility, even in suboptimal detection scenarios, confirms its robustness for the subsequent dental arch curve fitting procedure.

\begin{figure}
	\vspace{-0.35cm}
	\centering
	\includegraphics[totalheight=0.9in]{fig2.pdf}
	\caption{Evaluations of dental arch curve detection. a. Accuracy of feature point detection. b. Feature point detection results of case 5. c. Feature point detection results of case 9. d. A case for dental arch curve fitting with 1, 10, and 50 EM iteration cycles.}
	\vspace{-1cm}
\end{figure}

\subsection{Feasibility Analysis of Dental Arch Curve Fitting Function}
When defining the fitting function in Equation (1), we assume that this fitting function can fit a 3D dental arch curve that primarily lies around a plane. This hypothesis of dental arch morphology was validated through geometric analysis of 220 fitted curves (110 in maxilla, 110 in mandible) from their corresponding ground truth feature points. For each fitted curve, we computed the optimal approximation plane by minimizing the orthogonal distance. All orthogonal distances are larger than 0, with mean orthogonal deviation of $0.053 \pm 0.056$ mm. This confirms the feasibility of our parametric curve fitting function in capturing the near-planar 3D dental arch curve.

\subsection{Curvilinear Volume Parameterization for Tooth Segmentation}
We propose curvilinear volume parameterization to establish 3D dental arch detection as a plug-and-play tool for tooth segmentation. To validate this tool's efficacy, we compared four popular segmentation architectures: nnU-Net 2D \cite{21}, nnU-Net 3D \cite{20}, SegResNet \cite{25}, and MedNext \cite{26}. For each architecture, training and testing were performed separately on both: (1) the original 3D CBCT volumes, and (2) their transformed cuboid volumes generated through curvilinear volume parameterization. Comparative analysis extends to recent tooth segmentation methods \cite{14,5,28,29,30,31} with their reported performance metrics and 3D CBCT images used. Quantitative results are presented in Table~\ref{tab:comparison}. Let TP, TN, FP, and FN represent true positives, true negatives, false positives, and false negatives, respectively. Three metrics \cite{27} quantify segmentation accuracy: $\mathrm{Dice} = \frac{2\mathrm{TP}}{2\mathrm{TP} + \mathrm{FP} + \mathrm{FN}}$, $\mathrm{Precision} = \frac{\mathrm{TP}}{\mathrm{TP} + \mathrm{FP}}$, and $\mathrm{Recall} = \frac{\mathrm{TP}}{\mathrm{TP} + \mathrm{FN}}$. Experimental results show that the dental arch curve successfully guides tooth segmentation, achieving segmentation metrics comparable to those of state-of-the-art methods.

\begin{table}[h]
	\vspace{-0.3cm}
	\centering
	\caption{Comparison with existing methodologies in individual tooth segmentation}
	\label{tab:comparison}
	\begin{tabular}{|l|c|c|c|c|c|}
		\hline
		\multirow{2}{*}{Methodology} & \multirow{2}{*}{\makecell{Dental arch\\ guide}} & \multirow{2}{*}{\makecell{3D CBCT\\ images used}} & \multicolumn{3}{c|}{Metrics (\%)} \\ \cline{4-6}
		& & & Precision & Dice & Recall \\ \hline
		\multirow{2}{*}{nnU-Net 2D \cite{21}} & No & \multirow{2}{*}{110} & 74.05 & 72.15 & 71.34 \\ \cline{2-2} \cline{4-6}
		& Yes & & 93.83 & 93.57 & 93.30 \\ \hline
		\multirow{2}{*}{nnU-Net 3D \cite{20}} & No & \multirow{2}{*}{110} & 74.07 & 72.37 & 72.77 \\ \cline{2-2} \cline{4-6}
		& Yes & & 93.72 & 93.91 & 94.09 \\ \hline
		\multirow{2}{*}{SegResNet \cite{25}} & No & \multirow{2}{*}{110} & 74.47 & 73.34 & 74.25 \\ \cline{2-2} \cline{4-6}
		& Yes & & 93.66 & 93.88 & 94.10 \\ \hline
		\multirow{2}{*}{MedNext \cite{26}} & No & \multirow{2}{*}{110} & 74.10 & 72.66 & 73.34 \\ \cline{2-2} \cline{4-6}
		& Yes & & 94.33 & 94.33 & 94.32 \\ \hline
		Cui et al. \cite{14} & - & 20 & - & 91.98 & - \\ \hline
		Jang et al. \cite{5} & - & 97 & 95.97 & 94.79 & 93.71 \\ \hline
		Li et al. \cite{28} & - & 350 & 92.13 & 91.13 & 91.23 \\ \hline
		Tan et al. \cite{29} & - & 314 & - & 95.78 & - \\ \hline
		Shaheen et al. \cite{30} & - & 186 & - & 90 & - \\ \hline
		Liu et al. \cite{31} & - & 451 & - & 94.3 & - \\ \hline
	\end{tabular}
	\vspace{-1cm}
\end{table}

\section{Acknowledgments}
This work was supported in part by the Guangdong Higher Education Key Platform and Research Project under Grant 2020ZDZX3039, and in part by the Guangdong Provincial Key Laboratory of Interdisciplinary Research and Application for Data Science under Grant 2022B1212010006.

\section{Conclusion}
This study is the first to propose 3D dental arch curve detection from volumetric CBCT images and demonstrates that precise 3D dental arch curve detection serves as a plug-and-play tool for automated tooth segmentation. Experimental results show that our 3D dental arch curve detection is accurate and robust. The benchmark segmentation methods guided by the dental arch curve are much more accurate than the same methods without dental arch curve guidance.

%
% ---- Bibliography ----
%
% BibTeX users should specify bibliography style 'splncs04'.
% References will then be sorted and formatted in the correct style.
%

\bibliographystyle{splncs04}
\bibliography{mybibliography}


\end{document}
