\documentclass[
  journal=proceedings,
  manuscript=article-type,
  year=2024
]{PMET_proc}

\usepackage{amsmath}
\usepackage[nopatch]{microtype}
\usepackage{booktabs}
%\usepackage{orcidlink}
%\newcommand{\orcidauthor}[2]{#1~\orcidlink{#2}}

\title{Some Posterior Standard Deviations of the Graded Response Model}
%\author{\orcidauthor{Seock-Ho Kim}{0000-0002-2353-7826}}
\author{Seock-Ho Kim}
\affiliation{Department of Educational Psychology, University of Georgia, Athens, GA 30602, USA}
\email[Seock-Ho Kim]{shkim@uga.edu}

%\author{S. Author}
%\affiliation{Second Division, Organization, City, Pincode, State, Country}
% \alsoaffiliation{Joint first authors}

%\author{T. Author}
%\affiliation{Second Division, Organization, City, Pincode, State, Country}

%\author{F.T. Author}
%\affiliation{Fourth Division, Organization, City, Pincode, State, Country}

\addbibresource{exampleSHK.bib}

\keywords{Bayes modal estimation, graded response model, item response theory, posterior standard deviations} %% First letter not capped

\begin{document}

\begin{abstract}
The procedures required to obtain the approximate posterior standard deviations of the parameters of the graded response model for polytomously scored items from Bayes modal estimation are described and used to generate values for some common situations.  
The results were compared with those obtained from maximum likelihood estimation.  
It is shown that the use of priors may reduce the instability of Bayes modal estimates of the item parameters assuming the choice of priors is reasonable.  
The sample size required for acceptable accuracy for purposes of practical applications of item response theory may be inferred from the tables or the computer code in R.  
It is suggested that careful selection and specifications of priors be exercised to obtain the required precision when the graded response model is used in these situations.
\end{abstract}


\section{Introduction}
Thissen and Wainer (1982) presented the magnitudes of the asymptotic standard errors of estimated item parameters in the three commonly used IRT models for binary items.   
The standard errors were obtained using maximum likelihood estimation and presented in a convenient form
assuming that one examinee, randomly sampled from a population of a Gaussian distribution with zero mean and unit variance, responded to the item.  
Based on the required precision and the values of item parameters, the readers can find a minimum sample size to achieve the accurate estimation of item parameters.
Kim (2023) extended Thissen and Wainer's approach to the graded response model (Samejima, 1969, 1972), one of the IRT models for polytomous items.

The effect of the priors of item parameters on the approximate posterior standard deviations from Bayes modal estimation for the three IRT models for binary items is presented in Kim (2007).
Such effect is not well known, however, for the IRT models for polytomous items.  
A number of different forms of priors have been proposed in the estimation of item parameters of the graded response model (see Kim, 2024, and references there in) and implemented in various IRT computer programs, for example, PARSCALE (Muraki \& Bock, 1993, 2002; see also  du Toit, 2003), MULTILOG (Thissen, 1991; Thissen, Chen, \& Bock, 2002), and flexMIRT (Houts \& Cai, 2013).
This paper used the priors in the computer program PARSCALE.


\section{Estimation and Posterior Standard Deviations}

\subsection{Bayes Modal Estimation}
If the item response model is a function of ability $\theta_{i}$ for an examinee $i$ and a set of item parameters $\xi$, the probability of a response $k$ to the item can be written as
\[
P_{ik} = P(r_i = k | \theta_i, \xi),
\]
where $r_i$ is the examinee's response.
The likelihood function of the observed responses for $N$ independent examinees is (with an indicator variable $u_{ik}=1$ for $r_i = k$ and $u_{ik}=0$ otherwise)
\[
L = \prod_{i=1}^{N} \prod_{k=1}^{K} P_{ik}^{u_{ik}}.
\]

Let $l = \sum_{i=1}^{N} \sum_{k=1}^{K} u_{ik} \log P_{ik}$ be the log likelihood and $\pi = \log p(\xi)$ be the log prior of $\xi$.
From Bayes theorem, the log posterior is proportional to the log likelihood and the log prior,
\[
\log
{\rm posterior} 
\propto 
l + \pi 
= \sum_{i=1}^{N} \sum_{k=1}^{K} u_{ik} \log P_{ik}
+ \log p(\xi).
\]
The Bayes modal estimates of item parameters in $\xi$ are located where the partial derivatives
\[
\frac{\partial (l + \pi)}{\partial \xi} 
= \sum_{i=1}^{N} \sum_{k=1}^{K} 
\frac{u_{ik}}{P_{ik}} \frac{\partial P_{ik}}{\partial \xi} 
+ \frac{\partial \pi}{\partial \xi}
\]
are zero.

If the log posterior has a well-defined maximum, the degree of concavity would determine the sampling variances of the modal estimates.
The second partial derivatives of the log posterior can be obtained
for any parameter $\xi_{s}$ and $\xi_{t}$.
The second partial derivatives of the log posterior have the form
%{\scriptsize 
\begin{equation}
\frac{\partial^2 l}{\partial \xi_{s} \partial \xi_{t}}
+ \frac{\partial^2 \pi}{\partial \xi_{s} \partial \xi_{t}} 
=  
\sum_{i=1}^{N} \sum_{k=1}^{K} \left\{ \frac{u_{ik}}{P_{ik}} 
\frac{\partial^2 P_{ik}}{\partial \xi_{s} \partial \xi_{t}} +
\frac{\partial P_{ik}}{\partial \xi_{s}}
\left( \frac{- u_{ik}}{P_{ik}^{2}} \right)
\frac{\partial P_{ik}}{\partial \xi_{t}}
\right\}
+ \frac{\partial^2 \pi}{\partial \xi_{s} \partial \xi_{t}}.
\end{equation}
%}
The inverse of the negative value of the matrix of second derivatives of the log posterior approximates the asymptotic variance and covariance matrix of the Bayes modal estimates (Berger, 1985; Mislevy, 1986; Tsutakawa \& Johnson, 1990).  

For the likelihood part, the density of $\theta$ with the subscript $i$ omitted is taken to be $\phi(\theta)$, and we obtain the expectation of the second partial derivatives by substituting $P_{k}$ for $u_{k}$ with the subscript $i$ omitted. We simplify and integrate, thus obtaining
\begin{equation}
- E \left( \frac{\partial^2 l}{\partial \xi_s \partial \xi_t} \right) =
N \int_{- \infty}^{\infty} \sum_{k=1}^{K} \left\{ 
\left( \frac{1}{P_k} \right) \left( \frac{\partial P_{k}}{\partial \xi_s} 
\frac{\partial P_{k}}{\partial \xi_t} \right)
\right\} \phi(\theta) d \theta.
\end{equation}
The partial derivatives of $P_k$ with respect to its parameters and the specification of $\phi(\theta)$ are needed for the evaluation of Equation 2.  
The density of $\theta$, $\phi(\theta)$, is assumed to be Gaussian with mean zero and variance one.


\subsection{Derivatibes of Item Response Functions}
The graded response model in the logistic form for $k = 1, \ldots K$ is
\[
P_{k} = P_{k-1}^{*} - P_{k}^{*},
\]
where
\[
P_{k-1}^{*} = \frac{1}{1 + \exp\{ -a(\theta - b_{k-1})\}}
\] 
and
\[
P_{k}^{*} = \frac{1}{1 + \exp\{ -a(\theta - b_{k})\}}
\]
in which $a$ is the slope parameter of the boundary response function, and $b_{k-1}$ and $b_{k}$ are the location parameters.
Note that $P_{0}^{*} = 1$ (i.e., $b_{0} \equiv - \infty$) and $P_{K}^{*} = 0$ (i.e., $b_{K} \equiv \infty$) by definition.

The partial derivatives of the graded response model for the respective parameters are
\[
\frac{\partial P_{k}}{\partial a} =
\frac{\partial P_{k-1}^{*}}{\partial a} -
\frac{\partial P_{k}^{*}}{\partial a}
=
P_{k-1}^{*} Q_{k-1}^{*} (\theta - b_{k-1}) -
P_{k}^{*} Q_{k}^{*} (\theta - b_{k})
\]
and 
\[
\frac{\partial P_{k}}{\partial b_{k}} =
\frac{\partial P_{k-1}^{*}}{\partial b_{k}} -
\frac{\partial P_{k}^{*}}{\partial b_{k}}
=
P_{k}^{*} Q_{k}^{*}(-a),
\]
where $Q_{k-1}^{*} = 1 - P_{k-1}^{*}$ and $Q_{k}^{*} = 1 - P_{k}^{*}$.


With $w_{k} = P_{k}^{*} Q_{k}^{*}$ we can obtain:
%{\tiny 
\[
- E \left( \frac{\partial^{2} l}{\partial a^{2}} \right) =
N \int_{-\infty}^{\infty} \sum_{k=1}^{K} \left[ 
\left( \frac{1}{P_{k}} \right) 
\{ w_{k-1}(\theta - b_{k-1}) - w_{k}(\theta - b_{k}) \}^{2}
\right] \phi(\theta) d\theta
\]
\[
- E \left( \frac{\partial^{2} l}{\partial b_{k}^{2}} \right) =
N \int_{-\infty}^{\infty} (-a w_{k})^{2}  
\left( \frac{1}{P_{k}} + \frac{1}{P_{k+1}} \right) 
\phi(\theta) d\theta
\]
\[
- E \left( \frac{\partial^{2} l}{\partial b_{k-1} \partial b_{k}} \right) =
-
N \int_{-\infty}^{\infty} a^{2} w_{k-1} w_{k}  
\left( \frac{1}{P_{k}} \right) 
\phi(\theta) d\theta
\]
\[
- E \left( \frac{\partial^{2} l}{\partial b_{k} \partial b_{k+1}} \right) =
-
N \int_{-\infty}^{\infty} a^{2} w_{k} w_{k+1}  
\left( \frac{1}{P_{k+1}} \right) 
\phi(\theta) d\theta
\]
\[
- E \left( \frac{\partial^{2} l}{\partial a \partial b_{k}} \right) =
-
N \int_{-\infty}^{\infty} a (\theta - b_{k}) w_{k}   
\left( \frac{(w_{k-1} - w_{k})}{P_{k}} - \frac{(w_{k} - w_{k+1})}{P_{k+1}} \right) 
\phi(\theta) d\theta
\]
%}
The similar derivatives are given by Baker (1992, pp.\ 233--236) and elsewhere. 


\subsection{Derivatives of Priors}
For the graded response model, a lognormal distribution (Hogg \& Craig, 1978, p.\ 180) with $\mu_{\log a}$ and $\sigma_{\log a}^{2}$ for $a$,
\[
p(a) = \left\{ 
\begin{array}{ll}
\displaystyle 
\frac{1}{\sqrt{2 \pi} \sigma_{\log a}} \exp \left[ - \frac{1}{2} 
\left( \frac{\log a - \mu_{\log a}}{\sigma_{\log a}} \right)^{2} \right] \frac{1}{a} & \mbox{if $0 < a < \infty$} \\
0 & {\rm otherwise},
\end{array}
\right.
\] 
can be employed in PARSCALE.  
The second derivative of the log prior for $a$ is
\[
\frac{\partial^{2} \log p(a)}{\partial a^{2}} =
- \frac{1 - (\log a - \mu_{\log a} + \sigma_{\log a}^{2})}
{\sigma_{\log a}^{2} a^{2}}.
\]

A normal distribution (Hogg \& Craig, 1978, p.\ 111) with $\mu_{b_k}$ and $\sigma_{b_k}^{2}$ can be taken as the prior for $b_k$ in PARSCALE,
\[
p(b_k) = \frac{1}{\sqrt{2 \pi} \sigma_{b_k}} \exp 
\left[ - \frac{1}{2} \left( \frac{b_{k} - \mu_{b_k}}{\sigma_{b_k}} \right)^{2}  \right] \ \ \mbox{for $-\infty < b_{k} < \infty$}.
\]  
The second partial derivative of the log prior for $b_{k}$ is
\[
\frac{\partial^{2} \log p(b_{k})}{\partial b_{k}^{2}} =
- \frac{1}{\sigma_{b_{k}}^{2}}.
\]
It is assumed later that $\sigma_{b}^{2}$ are the same for all $k$.


\section{Method}
Since priors do not depend on the $N$ examinees, the magnitudes of the approximate posterior standard deviations cannot be tabulated in a convenient form as in Thissen and Wainer (1982) and in Kim (2023).
The approximate posterior standard deviations depend on both $N$ and priors.
The contribution of the priors to the magnitude of the approximate posterior standard deviations will be affected by sample size rather unsystematically because of the inversion of the matrix of the second derivatives.
A set of R code was developed to obtain the approximate posterior standard deviations
for the graded response model with two to nine categories.

To compare the asymptotic standard errors from the maximum likelihood method and the approximate posterior standard deviations, two sample sizes ($N=100$ and $N=1000$) are used to obtain the main results presented in the next section.
Other interesting results from different sample sizes are also reported.
For the graded response model with $k$ categories, the priors were a lognormal prior on $a$ with $\mu_{\log a}=0$ and $\sigma_{\log a}^{2}=0.5^{2}$ and normal priors on $b_k$ with $\mu_{b_k}=0$ and $\sigma_{b_k}^{2}=2^{2}$.


\section{Results}
The results obtained through the use of Equation 1 (i.e., posterior standard deviations) and Equation 2 (i.e., standard errors) could be shown for various situations.
Table 1 is presented here as a summary
(n.b., Tables 2--9 are not presented here but available from the author):
For example,   
Tables 2--3 for the posterior standard deviations for the graded response model with two categories (GR2) with 100 and 1000 examinees,  
Tables 4--5 for the standard errors for GR2 with 100 and 1000 examinees,
Tables 6--7 for the posterior standard deviations for GR3 with 100 and 1000 examinees, and
Tables 8--9 for the standard errors for GR3 with 100 and 1000 examinees.
Other possible tables for GR4 to GR9 are too voluminous to present.
Note that results from Tables 2--9 are summarized with Figures 1--5.


\begin{table}[hbt!]
\caption{\textit{Sample Size Required to Achieve One Decimal Place of Accuracy for Location and Slope for the Graded Response Model with Two to Nine Categories (GR2--GR9) When Slope Is 1.5 and the Locations Range $-2$ to $+2$ with Increment of $0.5$ from Bayes Modal Estimation with Normal Priors of $N(0, 2^2)$ on Location and Lognormal Prior of $LN(0, 0.5^2)$ on Slope and from Maximum Likelihood Estimation (MLE)}}
%{\footnotesize
%\scriptsize 
%\small
\begin{tabular}{llrrl}
%\\
%\hline
%\\
\toprule
\headrow
Model & Parameter & Sample Size & MLE Sample Size & Example Set ($a$, $b$'s) \\
\midrule
%\\
%\hline
%\\
GR2 & Location & 7493 & 7500 & (1.5, -2.0) \\
    & Slope    & 8897 & 8912 & (1,5, -2.0) \\
%\\
GR3 & Location & 4026 & 4020 & (1.5, -2.0,  2.0) \\
    & Slope    & 4640 & 4652 & (1.5, -2.0, -1.5) \\
%\\
GR4 & Location & 3414 & 3411 & (1.5, -2.0, -1.5,  2.0) \\
    & Slope    & 2844 & 2852 & (1.5, -2.0, -1.5, -1.0) \\
%\\
GR5 & Location & 3024 & 3025 & (1.5, -2.0, -1.5, -1.0,  2.0) \\
    & Slope    & 1945 & 1954 & (1.5, -2.0, -1.5, -1.0, -0.5) \\
%\\
GR6 & Location & 2777 & 2788 & (1.5, -2.0, -1.5, -1.0, -0.5, 2.0) \\
    & Slope    & 1450 & 1460 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0) \\
%\\
GR7 & Location & 2623 & 2622 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 2.0) \\
    & Slope    & 1163 & 1170 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 0.5) \\
%\\
GR8 & Location & 2494 & 2500 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 1.0, 2.0) \\
    & Slope    &  991 &  986 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 0.5, 1.0) \\
%\\
GR9 & Location & 2483 & 2481 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 0.5, 1.0, 2.0) \\
    & Slope    &  888 &  889 & (1.5, -2.0, -1.5, -1.0, -0.5, 0.0, 0.5, 1.0, 1.5) \\
%\\
%\hline \\
\bottomrule
%\multicolumn{5}{l}{\textit{Note.} Values of the MLE sample size are from Kim (2023).} \\
\end{tabular}
\begin{tablenotes}[hang]
\item [] \textit{Note.} Values of the MLE sample size are from Kim (2023).
\end{tablenotes}
%}
\end{table}


Shown in Table 1 are the sample sizes required to achieve one decimal place of accuracy for location and slope for the graded response model with two to nine categories (GR2--GR9) when slope is 1.5 and the location range $-2$ to $+2$ with increment of 0.5.
The posterior standard deviation of the order of 0.05 was considered for accuracy.
The sample sizes from maximum likelihood estimation were also reported in Table 1 based on Kim (2023).  
The standard error of the order of 0.05 was considered for accuracy.

The approximate sample sizes to achieve one decimal place of accuracy for parameters in the graded response model from Bayes modal estimation are based on the the results from the R code for GR2--GR9.
The sample sizes required to achieve one decimal place of accuracy for GR2 from Bayes modal estimation when slope is 1.5 and the location range $-2$ to $+2$ are 7493 for location and 8897 for slope.
The sample sizes required to achieve one decimal place of accuracy for GR2 from maximum likelihood estimation when slope is 1.5 and the location range $-2$ to $+2$ are 7500 for location and 8912 for slope.

The sample sizes required to achieve one decimal place of accuracy for GR3 from Bayes modal estimation when slope is 1.5 and the location range $-2$ to $+2$ are 4026 for location and 4640 for slope.
The sample sizes required to achieve one decimal place of accuracy for GR3 from maximum likelihood estimation when slope is 1.5 and the location range $-2$ to $+2$ are 4020 for location and 4652 for slope.

The required sample sizes are gradually reduced when the number of categories of the item increases.
Both Bayes modal estimation and maximum likelihood estimation are expected to use very large but nearly the same sample sizes for the one decimal place of accuracy of parameter estimates, respectively, assessed by the size of posterior standard deviations and the size of standard errors.


\begin{figure}[hbt!]
\includegraphics[width=.40\linewidth]{psdfigure1.eps} %\hfill
\includegraphics[width=.40\linewidth]{psdfigure2.eps} \\
\caption{%1. 
Bayes Modal Posterior Standard Deviations (PSDs) in Red and Maximum Likelihood Standard Errors (SEs) in Blue of Location (Left Figure) and Slope (Right Figure) for the Graded Response Model with Two Categories When Slope Is 1.5 with Sample Sizes of 100 and 1000}
\label{psdfigure1}
\end{figure}


Let us compare the posterior standard deviations and the standard errors of location for GR2 for two sample sizes ($N=100$ and $N=1000$) in order to get a better feel for the sample size issue and the estimation method issue.
Shown in Figure 1 are the Bayes modal posterior standard deviations and the maximum likelihood standard errors of location (i.e., left figure) and slope (i.e., right figure) for GR2 when slope is 1.5 which is a representative value for most serious testing applications.
In the left figure for a sample of 100 for the location range $-3$ to $+3$, the posterior standard deviations of location are smaller, sometimes trivially so in the middle of the range, than the standard errors of location.
For a sample size of 100 for the location range $-1$ to $+1$ both posterior standard deviations of location and standard errors of location are below of the order of 0.2.
For a sample of 1000 for the location range $-3$ to $+3$ the posterior standard deviations of location are the same as the standard errors of location.
For a sample of 1000 for the location range $-2.5$ to $+2.5$ both posterior standard deviations of location and standard errors of location are below of the order of 0.2.
As inferred from Table 1, for the sample size of 1000 both posterior standard deviations of location and standard errors of location are much larger than of the order of $0.05$ for the entire location range.

In the right figure for a sample of 100 for the location range $-3$ to $+3$, the posterior standard deviations of slope are smaller than the standard errors of location.
For a sample of 100 for the location range $-1$ to $+1$ both posterior standard deviations of slope and standard errors of slope are below of the order of 0.4.  
For a sample of 1000 for the location range $-3$ to $+3$ the posterior standard deviations of slope are the same as the standard errors of slope.
For a sample of 1000 for the location range $-2.5$ to $+2.5$ both posterior standard deviations of slope and standard errors of slope are below of the order of 0.2.
For a sample size of 1000 none of the posterior standard deviations of slope and the standard errors of slope are below of the order of 0.1.
As also inferred from Table 1, for the sample size of 1000 both posterior standard deviations of slope and standard errors of slope are much larger than of the order of $0.05$ for the entire location range.

It is disquieting to see in Figure 1 that adequate estimates of location or slope cannot be obtained with the sample of 1000 regardless of whether Bayes modal estimation or maximum likelihood estimation is used.
The sample size to achieve the one decimal accuracy of location or slope if the location range is extended to $-3$ and $+3$ would be more than 10000 which is as large a sample as plausible with only truly large scale assessment cases.


\begin{figure}[hbt]
\includegraphics[width=.40\linewidth]{psdfigure3.eps} %\hfill
\includegraphics[width=.40\linewidth]{psdfigure4.eps} \\
\includegraphics[width=.40\linewidth]{psdfigure7.eps} %\hfill
\includegraphics[width=.40\linewidth]{psdfigure8.eps} \\
%\vspace*{-.25in}
\caption{%2. %{\small 
The Posterior Standard Deviation of Location (Left Side) and Slope (Right Side) Shown as a Bivariate Function of Slope and Location for the Graded Response Model with Two Categories with Sample Size 100 (Top Figures) and 1000 (Bottom Figures)}
%}
\label{psdfigure2}
\end{figure}

\begin{figure}[hbt]  
\includegraphics[width=.40\linewidth]{psdfigure5.eps} %\hfill 
\includegraphics[width=.40\linewidth]{psdfigure6.eps} \hfill \\ 
\includegraphics[width=.40\linewidth]{psdfigure9.eps} %\hfill
\includegraphics[width=.40\linewidth]{psdfigure10.eps} \\
%\vspace*{-.25in}
\caption{%3. %{\small 
The Standard Error of Location (Left Side) and Slope (Right Side) Shown as a Bivariate Function of Slope and Location for the Graded Response Model with Two Categories with Sample Size 100 (Top Figures) and 1000 (Bottom Figures)}
%}
\label{psdfigure3}
\end{figure}


Let us examine three-dimensional plots in order to better understand the relationship that the slope and the location parameter for GR2 has with posterior standard deviation.
Shown in Figure 2 are the posterior standard deviations taken from Table 2 of location (i.e., top left figure) and slope (i.e., top right figure), respectively, for GR2 with a sample of 100.

The perspective plot in the top left figure, conditioned on each slope value, shows that the posterior standard deviation of location reaches its minimum at a point where location is 0 which is the center of the ability distribution.
All conditional functions of the posterior standard deviation of location are concave down with location 0 to have their minimum values.
The plot also shows that the posterior standard deviation of location gradually decreases as the value of slope increases, except for the two extreme location regions.

The perspective plot in the top right figure, conditioned on each location value, shows that the posterior standard deviation of slope sharply increases as the value of slope increases.
For relatively larger values of slope, the posterior standard deviation of slope reaches its minimum at a point where location is 0.
The magnitude of the posterior standard deviations of slope gets larger when its value is large and location is far away from the center of the ability distribution.  
Nevertheless all posterior standard deviations of slope reach their minimum when location is 0.

Shown also in Figure 2 are the posterior standard deviations taken from Table 3 of location (i.e., bottom left figure) and slope (i.e., bottom right figure), respectively, for GR2 with a sample of 1000.
The general sizes of the posterior standard deviations from the two bottom figure are much smaller than those from the two top figures.

The perspective plot in the bottom left figure, conditioned on each slope value, shows that the posterior standard deviation of location reaches its minimum at a point where location is 0 which is the center of the ability distribution.
All conditional functions of the posterior standard deviation of location are concave down with location 0 to have their minimum values.
The plot also shows that the posterior standard deviation of location gradually decreases as the value of slope increases.

The perspective plot in the bottom right figure, conditioned on each location value, shows that the posterior standard deviation of slope gradually increases as the value of slope increases.
For relatively larger values of slope, the posterior standard deviation of slope reaches its minimum at a point where location is 0.
The magnitude of the posterior standard deviations of slope gets larger when its value is large and location is far away from the center of the ability distribution.  
All posterior standard deviations of slope reach their minimum when location is 0, but such a pattern is not really noticeable for $a=0.5$.

In order to compare the posterior standard deviation from Bayes modal estimation and the standard errors from maximum likelihood estimation, let us examine three-dimensional plots in order to better understand the relationship that the slope and the location parameter for GR2 has with standard error.
Shown in Figures 3 are the standard errors taken from Table 4 of location (i.e., top left figure) and slope (top right figure) for GR2 with a sample of 100.

The perspective plot in the top left figure, conditioned on each slope value, shows that the standard error of location reaches its minimum at a point where location is 0 which is the center of the ability distribution.
All conditional functions of the standard error of location are concave down with location 0 to have their minimum values.
The plot also shows that the standard error of location gradually decreases as the value of slope increases.

The perspective plot in the top right figure, conditioned on each location value, shows that the standard error of slope gradually increases as the value of slope increases.
For relatively larger values of slope, the standard error of slope reaches its minimum at a point where location is 0.
The magnitude of the standard errors of slope gets larger when its value is large and location is far away from the center of the ability distribution.  
All standard errors of slope reach their minimum when location is 0, but such a pattern is not really noticeable for $a=0.5$.

Shown also in Figure 3 are the standard errors taken from Table 5 of location (i.e., bottom left figure) and slope (i.e., bottom right figure), respectively, for GR2 with a sample of 1000.
The general sizes of the standard errors from the two bottom figures are much smaller than those from the two top figures.

The perspective plot in the bottom left figure, conditioned on each slope value, shows that the standard error of location reaches its minimum at a point where location is 0 which is the center of the ability distribution.
All conditional functions of the standard error of location are concave down with location 0 to have their minimum values.
The plot also shows that the standard error of location gradually decreases as the value of slope increases.

The perspective plot in the bottom right figure, conditioned on each location value, shows that the standard error of slope gradually increases as the value of slope increases.
For relatively larger values of slope, the standard error of slope reaches its minimum at a point where location is 0.
The magnitude of the standard errors of slope gets larger when its value is large and location is far away from the center of the ability distribution.  
All standard errors of slope reach their minimum when location is 0, but such a pattern is not really noticeable for $a=0.5$.

Understanding the magnitudes of posterior standard deviations of location and slope as in Figure 2 and the magnitudes of standard errors of location and slope as in Figure 3 in GR2 is important because similar patterns are observed for other graded response model with more response categories, although the magnitudes get relatively smaller as the number of categories increases.
The posterior standard deviation of location and the standard error of location for GR2 when slope is 1.5 and location is 0 seems to provide the minimum value (i.e., the lower bound) for GR3--GR9 (n.b., trivially smaller values of posterior standard deviations of location and standard errors of location, respectively, might be observed).
The posterior standard deviations of slope and the standard errors of slope for GR2 for all corresponding points on the location range $-3$ to $+3$ seem to provide the maximum values for GR3--GR9 (i.e., the upper bounds).

Comparing the two top figures of Figures 2--3 reveals that the posterior standard deviations from large values of slope are relatively larger than the standard errors from the corresponding values of slope for a sample of 100.
For a sample of 100 the posterior standard deviations are relatively, trivially smaller than the standard errors if reasonable priors are employed (i.e., priors are matched with the respective parameters).
Figures 2--3 show, however, that practically the same precision measures are obtained for a sample of 1000.


\begin{figure}[hbt]
\includegraphics[width=.30\linewidth]{psdfigure11.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure12.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure13.eps} \\
\includegraphics[width=.30\linewidth]{psdfigure17.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure18.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure19.eps} \\
%\vspace*{-.25in}
\caption{%4. %{\small 
The Posterior Standard Deviation of Location 1 (Left Side), Location 2 (Middle), and Slope (Right Side) Shown as a Bivariate Function of Locaion 1 and Location 2 for the Graded Response Model with Three Categories When Slope is 1.5 with Sample Size 100 (Top Figures) and 1000 (Bottom Figures)}
%}
\label{psdfigure4}
\end{figure}

\begin{figure}[hbt]
\includegraphics[width=.30\linewidth]{psdfigure14.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure15.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure16.eps} \\
\includegraphics[width=.30\linewidth]{psdfigure20.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure21.eps} \hfill
\includegraphics[width=.30\linewidth]{psdfigure22.eps} \\
%\vspace*{-.25in}
\caption{%5. %{\small 
The Standard Error of Location 1 (Left Side), Location 2 (Middle), and Slope (Right Side) Shown as a Bivariate Function of Locaion 1 and Location 2 for the Graded Response Model with Three Categories When Slope is 1.5 with Sample Size 100 (Top Figures) and 1000 (Bottom Figures)}
%}
\label{psdfigure5}
\end{figure}


Shown in Figure 4 are the posterior standard deviations taken from Table 6 of location 1 (i.e., top left figure), location 2 (i.e., top middle figure), and slope (i.e., top right figure), respectively, for GR3 when slope is 1.5 with a sample of 100.
Slope can be specified by any value from 0.25 to 3 with a sample of 100.
But proportionally similar plots can be obtained to the three top figures.

%The perspective plot in the top left figure with the slope value of 1.5, shows that the posterior %standard deviation of location 1 reaches its minimum at a point where location 1 is 0 which is %the center of the ability distribution.
%For all other cases where location 1 is not 0, the posterior standard deviation of location 1 %gets smaller at a point where location 2 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the top middle figure with the slope value of 1.5, shows that the %posterior standard deviation of location 2 reaches its minimum at a point where location 2 is 0 %which is the center of the ability distribution.
%For all other cases where location 2 is not 0, the posterior standard deviation of location 2 %gets smaller at a point where location 1 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the top right figure with the slope value of 1.5, shows that the %posterior standard deviation of slope reaches its minimum at a point where both location 1 and %location 2 are close to 0, but both locations are neither too close nor too separated (e.g., %location 1 is $-1$ and location 2 is $+1$).
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks portions of the %concave down elliptic paraboloid surface.

Shown also in Figure 4 are the posterior standard deviations taken from Table 7 of location 1 (i.e., bottom left figure), location 2 (i.e., bottom middle figure), and slope (i.e., bottom right figure) for GR3 when slope is 1.5 with a sample of 1000.
Again, slope can be specified by any value from 0.25 to 3 with a sample of 1000.
But proportionally similar plots can be obtained to the three bottom figures.
The general sizes of the posterior standard deviations from the three bottom figures are much smaller than those from the three top figures.

%The perspective plot in the bottom left figure with the slope value of 1.5, shows that the %posterior standard deviation of location 1 reaches its minimum at a point where location 1 is 0 %which is the center of the ability distribution.
%For all other cases where location 1 is not 0, the posterior standard deviation of location 1 %gets smaller at a point where location 2 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the bottom middle figure with the slope value of 1.5, shows that the %posterior standard deviation of location 2 reaches its minimum at a point where location 2 is 0 %which is the center of the ability distribution.
%For all other cases where location 2 is not 0, the posterior standard deviation of location 2 %gets smaller at a point where location 1 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the bottom right figure with the slope value of 1.5, shows that the %posterior standard deviation of slope reaches its minimum at a point where both location 1 and %location 2 are close to 0, but both locations are neither too close nor too separated (e.g., %location 1 is $-1$ and location 2 is $+1$).
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks portions of the %concave down elliptic paraboloid surface.

In order to compare the posterior standard deviation from Bayes modal estimation and the standard errors from maximum likelihood estimation, let us examine three-dimensional plots in order to better understand the relationship that the slope and the location parameter for GR3 has with standard error.

Shown in Figure 5 are the standard error taken from Table 8 of location 1 (i.e., bottom left figure), location 2 (i.e., bottom middle figure), and slope (i.e., bottom right figure), respectively, for GR3 when slope is 1.5 with a sample of 100.
Slope can be specified by any value from 0.25 to 3 with a sample of 100.
But proportionally similar plots can be obtained to the top three figures.

%The perspective plot in the top left figure with the slope value of 1.5, shows that the standard %error of location 1 reaches its minimum at a point where location 1 is 0 which is the center of %the ability distribution.
%For all other cases where location 1 is not 0, the standard error of location 1 gets smaller at a %point where location 2 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the top middle figure with the slope value of 1.5, shows that the %standard error of location 2 reaches its minimum at a point where location 2 is 0 which is the %center of the ability distribution.
%For all other cases where location 2 is not 0, the standard error of location 2 gets smaller at a %point where location 1 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the top right figure with the slope value of 1.5, shows that the standard %error of slope reaches its minimum at a point where both location 1 and location 2 are close to %0, but both locations are neither too close nor too separated (e.g., location 1 is $-1$ and %location 2 is $+1$).
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks portions of the %concave down elliptic paraboloid surface.

Shown in also Figure 5 are the standard error taken from Table 9 of location 1 (i.e., top left figure), location 2 (i.e., top middle figure), and slope (i.e., top right figure) for GR3 when slope is 1.5 with a sample of 1000.
Again, slope can be specified by any value from 0.25 to 3 with a sample of 1000.
But proportionally similar plots can be obtained to the three bottom figures.
The general sizes of the posterior standard deviations from the three top figures are much smaller than those from the the three top figures.

%The perspective plot in the bottom left figure with the slope value of 1.5, shows that the %standard error of location 1 reaches its minimum at a point where location 1 is 0 which is the %center of the ability distribution.
%For all other cases where location 1 is not 0, the standard error of location 1 gets smaller at a %point where location 2 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the bottom middle figure with the slope value of 1.5, shows that the %standard error of location 2 reaches its minimum at a point where location 2 is 0 which is the %center of the ability distribution.
%For all other cases where location 2 is not 0, the standard error of location 2 gets smaller at a %point where location 1 is 0.
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks half of the %concave down paraboloidal reflector.

%The perspective plot in the bottom right figure with the slope value of 1.5, shows that the  %standard error of slope reaches its minimum at a point where both location 1 and location 2 are %close to 0, but both locations are neither too close nor too separated (e.g., location 1 is $-1$ %and location 2 is $+1$).
%Because the location parameters are ordered (i.e., $b_1 < b_2$) the plot looks portions of the %concave down elliptic paraboloid surface.

Figures 4--5 show that practically the same precision measures for location and slope are obtained for a sample of 100 as well as for a sample of 1000.
Note that the value for the slope is 1.5 in Figures 4--5 as well as Tables 6--9. 

Similar plots to that in Figure 4 for a sample of 100 and for a sample of 1000 for the posterior standard deviations as well as 
similar plots in that in Figure 5 for a sample of 100 and for a sample of 1000 for the standard errors may be constructed for GR4 and beyond.

For an example, a table can be obtained for GR4 for the posterior standard deviations of location 1, location 2, location 3, and slope with a sample of 100. 
Again, for brevity as in GR3, the value of slope can be fixed as 1.5. 
In addition, location 1 can be fixed as $-3$ in order to obtain such a table.
Another table can be obtained for the posterior standard deviation of location 1, location 2, location 3, and slope with a sample of 1000.
Again slope can be fixed as 1.5 and location 1 can also be fixed as $-3$ in order to obtain such a table.
From the two tables, perspective plots and be constructed to make, say Figure 6 (n.b., not actually created).
The x-dimension of each perspective plot designates the values of location 2 from the range $-2.5$ to $+2.5$, and the y-dimension designates the values of location 3 from the range $-2$ to $+3$.
There would be four plots, that is, one for each parameter for GR4 for a sample of 100.
A similar four perspective plots can be constructed for a sample of 1000.

Using the same logic, two tables can be construction for GR4 for the standard errors of location 1, location 2, location 3, and slope with a sample of 100 and with a sample of 1000, respectively.
From the two tables, a total of eight perspective plots of standard errors can be constructed and combined to yield, say Figure 7 (n.b., not actually created).

We may find that the same general structure would continue to hold for the posterior standard deviations and the standard errors.
As locations became close to 0 which is the center of the ability distribution, the posterior standard deviations of location and the standard errors of location get smaller.  
As locations became far away from 0 the posterior standard deviations of location and the standard errors of location get larger. 
Similar patterns would be observed for the posterior standard deviations of slope and the standard errors of slope.
In addition, as slopes became more gradual in size, the posterior standard deviations of slope and the standard errors of slope get larger.
As the number of locations increased the posterior standard deviations of slope and the standard errors of slope get smaller.

One coherent finding from the examination of the tables and figures is that the use of either Bayes modal estimation or maximum likelihood estimation for location and for slope of the graded response model yields results too inexact to be of practical use for a sample size less than, say, 2500.
Both methods of estimation require samples of enormous size, especially for location beyond $\pm 2$ the ability range so as to make it prohibitively expensive in terms of data collection.
This problem arises for items with locations away from the center of the ability distribution. 
When an item has adjacent categories in extreme ends relatively not endorsed, selected, or assigned, there are few observations available to estimate the location parameters thus making the accompanied posterior standard deviations as well as the standard errors very large.


\section{Discussion}
Many different forms of priors (e.g., empirical, hierarchical, and multivariate normal) have been suggested in Bayesian inference for parameters in item response category functions of the graded response model (see Kim, 2024).  
Priors having different
forms can certainly be used to estimate item parameters and to obtain approximate posterior standard deviations in Bayes modal estimation.  
In such a case we should obtain a different set of partial derivatives of the log priors.

Although the distributional forms of priors are the same as those used in this study, different prior parameters (i.e., hyperparameters) can be used in calculation of approximate posterior standard deviations.  
When the forms of priors are the same as ones presented earlier, the accompanying R code can be used to obtain approximate posterior standard deviations using various combinations of priors (e.g., lognormal for slope and uninformative uniform for location by commenting out the location portions of R code) and their parameter specifications.  
In this sense, attention should be given not only to the selection of the functional forms of priors but also to the values of prior parameters when a Bayesian approach is
used.

There remain some issues for future research related to this paper and use of Bayesian inference in IRT.  
Some examples are 
prior forms and specifications, 
robustness, 
model selection, and 
posterior intervals.  
When using a reasonable sample size to calibrate items, however, it seems unlikely that totally different or incomparable results of item parameter estimates and variability measures will be obtained from different estimation methods.


%\section{Conclusion}
%The conclusion text goes here.


%\begin{acknowledgement}
%Insert the Acknowledgment text here.
%\end{acknowledgement}

%\paragraph{Funding Statement}

%This research was supported by grants from the <funder-name> <doi> (<award ID>); <funder-name> %<doi> (<award ID>).

%\paragraph{Competing Interests}

%A statement about any financial, professional, contractual or personal relationships or %situations that could be perceived to impact the presentation of the work --- or `None' if none %exist.


%\endnote in some journals will behave like \footnote; and \printendnotes will not output anything. 
%\printendnotes

%\printbibliography

\section*{References}
\begin{description}

\item  
Baker, F.~B. (1992).  
\textit{Item response theory: Parameter estimation techniques.} 
New York:\ Dekker.

\item
Berger, J.~O. (1985).  
{\it Statistical decision theory and Bayesian analysis} (2nd ed.).  
New York:\ Springer-Verlag.

\item  
du Toit, M. (Ed.). (2003).  
\textit{IRT from SSI.}
Lincolnwood, IL:\ Scientific Software International.

\item
Hogg, R.~V., \& Craig, A.~T. (1978).  
\textit{Introduction to mathematical statistics} (4th ed.).  
New York:\ Macmillan.

\item 
Houts, C.\ R., \& Cai, L. (2013).
\textit{flexMIRT user's manual version 2.}
Chapel Hill, NC:\ Vector Psychometric Group.

\item 
Kim, S.-H. (2007).
Some posterior standard deviations in item response theory.
\textit{Educational and Psychological Measurement, 67}(2), 258-279.

\item 
Kim, S.-H. (2023).
\textit{Some standard errors of the graded response model}
[Manuscript submitted for publication].
Department of Educational Psychology, University of Georgia.

\item 
Kim, S.-H. (2024).
Priors in Bayesian estimation under the graded response model. 
In M.\ Wiberg, J.-S.\ Kim, H.\ Hwang, H.\ Wu, \& T.\ Sweet (Eds.),
\textit{Quantitative psychology research} (pp.\ 13--23).  
Cham, Switzerland:\ Springer.

\item
Mislevy, R.~J. (1986).  
Bayes modal estimation in item response models. 
{\it Psychometrika, 51,} 177--195.

\item 
Muraki, E., \& Bock, R.\ D. (1993).
\textit{PARSCALE:\ IRT based test scoring and item analysis for graded open-ended exercises and performance tasks.} 
Chicago, IL:\ Scientific Software International.

\item 
Muraki, E., \& Bock, R.\ D. (2002).
\textit{PARSCALE:\ IRT based test scoring and item analysis for graded open-ended exercises and performance tasks.} 
Lincolnwood, IL:\ Scientific Software International.

\item 
Samejima, F. (1969).
Estimation of latent ability using a response pattern of graded scores.
\textit{Psychometrika Monograph Supplement,} No.\ 17.

\item 
Samejima, F. (1972).
A general model for free-response data.
\textit{Psychometrika Monograph Supplement,} No.\ 18.

\item
Thissen, D. (1991).  
MULTILOG user's guide:\ Multiple, categorical item analysis and test scoring using item response theory [Computer software].  
Chicago:\ Scientific Software.

\item  
Thissen, D., Chen, W.-H., \& Bock, R.~D. (2002).  
MULTILOG [Computer software]. 
Lincolnwood, IL:\ Scientific Software International.

\item
Thissen, D., \& Wainer, H. (1982).  
Some standard errors in item response theory.  
{\it Psychometrika, 47,} 397--412.

\item
Tsutakawa, R.~K., \& Johnson, J.~C. (1990). 
The effect of uncertainly of item parameter estimation on ability estimates.
{\it Psychometrika, 55,} 371--390.

\end{description}

%\appendix

%\section{Example Appendix Section}

%Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut %labore et dolore magna aliqua. Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do %eiusmod tempor incididunt ut labore et dolore magna aliqua. Lorem ipsum dolor sit amet, %consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. 

\end{document}