<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.1371/journal.pone.0299947</article-id>
<article-id pub-id-type="publisher-id">PONE-D-21-24168</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Oral medicine</subject><subj-group><subject>Oral health</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Medical conditions</subject><subj-group><subject>Infectious diseases</subject><subj-group><subject>Bacterial diseases</subject><subj-group><subject>Caries</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Applied mathematics</subject><subj-group><subject>Algorithms</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Simulation and modeling</subject><subj-group><subject>Algorithms</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Artificial intelligence</subject><subj-group><subject>Machine learning</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>People and places</subject><subj-group><subject>Population groupings</subject><subj-group><subject>Age groups</subject><subj-group><subject>Children</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>People and places</subject><subj-group><subject>Population groupings</subject><subj-group><subject>Families</subject><subj-group><subject>Children</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Digestive system</subject><subj-group><subject>Teeth</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Digestive system</subject><subj-group><subject>Teeth</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Head</subject><subj-group><subject>Jaw</subject><subj-group><subject>Teeth</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Head</subject><subj-group><subject>Jaw</subject><subj-group><subject>Teeth</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Digestive system</subject><subj-group><subject>Mouth</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Digestive system</subject><subj-group><subject>Mouth</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Signs and symptoms</subject><subj-group><subject>Pain</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Artificial intelligence</subject><subj-group><subject>Machine learning</subject></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>Development of short forms for screening children’s dental caries and urgent treatment needs using item response theory and machine learning methods</article-title>
<alt-title alt-title-type="running-head">Short forms for children’s oral health assessment using item response theory and machine learning methods</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-5502-1464</contrib-id>
<name name-style="western">
<surname>Xiong</surname>
<given-names>Di</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/software/">Software</role>
<role content-type="http://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="http://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Marcus</surname>
<given-names>Marvin</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Maida</surname>
<given-names>Carl A.</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Lyu</surname>
<given-names>Yuetong</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/software/">Software</role>
<role content-type="http://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="http://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-6697-907X</contrib-id>
<name name-style="western">
<surname>Hays</surname>
<given-names>Ron D.</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff005"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-4822-6514</contrib-id>
<name name-style="western">
<surname>Wang</surname>
<given-names>Yan</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Shen</surname>
<given-names>Jie</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Spolsky</surname>
<given-names>Vladimir W.</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Lee</surname>
<given-names>Steve Y.</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff006"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Crall</surname>
<given-names>James J.</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<name name-style="western">
<surname>Liu</surname>
<given-names>Honghu</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001"><label>1</label> <addr-line>Section of Public and Population Health, Division of Oral and Systemic Health Sciences, School of Dentistry, University of California, Los Angeles, Los Angeles, California, United States of America</addr-line></aff>
<aff id="aff002"><label>2</label> <addr-line>Department of Biostatistics, Fielding School of Public Health, University of California, Los Angeles, Los Angeles, California, United States of America</addr-line></aff>
<aff id="aff003"><label>3</label> <addr-line>Division of General Internal Medicine and Health Services Research, Department of Medicine, David Geffen School of Medicine, University of California, Los Angeles, Los Angeles, California, United States of America</addr-line></aff>
<aff id="aff004"><label>4</label> <addr-line>Department of Health Policy and Management, Fielding School of Public Health, University of California, Los Angeles, Los Angeles, California, United States of America</addr-line></aff>
<aff id="aff005"><label>5</label> <addr-line>RAND Corporation, Santa Monica, California, United States of America</addr-line></aff>
<aff id="aff006"><label>6</label> <addr-line>Section of Interdisciplinary Dentistry, Division of Diagnostic and Surgical Sciences, School of Dentistry, University of California, Los Angeles, Los Angeles, California, United States of America</addr-line></aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Cilar Budler</surname>
<given-names>Leona</given-names>
</name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1"><addr-line>University of Maribor, SLOVENIA</addr-line></aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">hhliu@dentistry.ucla.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>3</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>19</volume>
<issue>3</issue>
<elocation-id>e0299947</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>7</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>2</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-year>2024</copyright-year>
<copyright-holder>Xiong et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0299947"/>
<abstract>
<sec id="sec001">
<title>Objectives</title>
<p>Surveys can assist in screening oral diseases in populations to enhance the early detection of disease and intervention strategies for children in need. This paper aims to develop short forms of child-report and proxy-report survey screening instruments for active dental caries and urgent treatment needs in school-age children.</p>
</sec>
<sec id="sec002">
<title>Methods</title>
<p>This cross-sectional study recruited 497 distinct dyads of children aged 8–17 and their parents between 2015 and 2019 from 14 dental clinics and private practices in Los Angeles County. We evaluated responses to 88 child-reported and 64 proxy-reported oral health questions to select and calibrate short forms using Item Response Theory. Seven classical Machine Learning algorithms were employed to predict children’s active caries and urgent treatment needs using the short forms together with family demographic variables. The candidate algorithms include CatBoost, Logistic Regression, K-Nearest Neighbors (KNN), Naïve Bayes, Neural Network, Random Forest, and Support Vector Machine. Predictive performance was assessed using repeated 5-fold nested cross-validations.</p>
</sec>
<sec id="sec003">
<title>Results</title>
<p>We developed and calibrated four ten-item short forms. Naïve Bayes outperformed other algorithms with the highest median of cross-validated area under the ROC curve. The means of best testing sensitivities and specificities using both child-reported and proxy-reported responses were 0.84 and 0.30 for active caries, and 0.81 and 0.31 for urgent treatment needs respectively. Models incorporating both response types showed a slightly higher predictive accuracy than those relying on either child-reported or proxy-reported responses.</p>
</sec>
<sec id="sec004">
<title>Conclusions</title>
<p>The combination of Item Response Theory and Machine Learning algorithms yielded potentially useful screening instruments for both active caries and urgent treatment needs of children. The survey screening approach is relatively cost-effective and convenient when dealing with oral health assessment in large populations. Future studies are needed to further customize and refine the instruments based on the estimated item characteristics for specific subgroups of the populations to enhance predictive accuracy.</p>
</sec>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000072</institution-id>
<institution>national institute of dental and craniofacial research</institution>
</institution-wrap>
</funding-source>
<award-id>U01DE022648</award-id>
</award-group>
<award-group id="award002">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000072</institution-id>
<institution>national institute of dental and craniofacial research</institution>
</institution-wrap>
</funding-source>
<award-id>U01DE029491</award-id>
</award-group>
<award-group id="award003">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000025</institution-id>
<institution>national institute of mental health</institution>
</institution-wrap>
</funding-source>
<award-id>T32MH080634</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-4822-6514</contrib-id>
<name name-style="western">
<surname>Wang</surname>
<given-names>Yan</given-names>
</name>
</principal-award-recipient>
</award-group>
<funding-statement>This study was funded by two NIDCR/NIH (National Institute of Dental and Craniofacial Research/National Institutes of Health, <ext-link ext-link-type="uri" xlink:href="https://www.nidcr.nih.gov/" xlink:type="simple">https://www.nidcr.nih.gov/</ext-link>) grants to the University of California, Los Angeles (UCLA) (U01DE022648 and U01DE029491). Y. Wang was supported by the NIMH/NIH award T32MH080634. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="4"/>
<page-count count="18"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>The datasets analyzed in this study are not publicly available because they contain potentially identifying and sensitive patient information related to children's health. Researchers may approach the corresponding author (<email xlink:type="simple">hhliu@dentistry.ucla.edu</email>) and IRB (<email xlink:type="simple">MIRB@research.ucla.edu</email>) to submit an IRB application for requesting de-identified data. Requests should include a specific analysis plan. All aggregated data and questionnaires are included within the manuscript and its supporting files. Codes are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/dixiong777/COH_SF_IRTML" xlink:type="simple">https://github.com/dixiong777/COH_SF_IRTML</ext-link>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec005" sec-type="intro">
<title>1. Introduction</title>
<p>Early detection and intervention to prevent dental caries, the most common chronic disease of childhood [<xref ref-type="bibr" rid="pone.0299947.ref001">1</xref>], is critically important. In <italic>Savage Inequalities</italic>, Kozol noted that “Bleeding gums, impacted and rotting teeth are routine matters for the children I have interviewed in the South Bronx. The children get used to feeling constant pain” [<xref ref-type="bibr" rid="pone.0299947.ref002">2</xref>]. A recent study found that children with poor oral health status were three times more likely to miss school because of dental pain, with associated poorer school performance than their peers with better oral health [<xref ref-type="bibr" rid="pone.0299947.ref003">3</xref>]. Resource constraints substantially limit the feasibility of conducting traditional oral health examinations, especially for school-aged populations. The COVID-19 pandemic exacerbated the already limited access to school health education, nutritional support, and regular dental care [<xref ref-type="bibr" rid="pone.0299947.ref004">4</xref>, <xref ref-type="bibr" rid="pone.0299947.ref005">5</xref>].</p>
<p>Rather than intervening in the destructive process of dental disease, it is more cost-effective to identify dental disease early and address urgent problems. Survey instruments have been developed to assess children’s oral health problems such as the Child Oral Impact on Daily Performances (Child-OIDP) [<xref ref-type="bibr" rid="pone.0299947.ref006">6</xref>], Early Childhood Oral Health Impact Scale (ECOHIS) [<xref ref-type="bibr" rid="pone.0299947.ref007">7</xref>], and the Child Perceptions Questionnaire (CPQ) [<xref ref-type="bibr" rid="pone.0299947.ref008">8</xref>, <xref ref-type="bibr" rid="pone.0299947.ref009">9</xref>]. But these existing surveys focus on the oral health-related quality-of-life impacts rather than on treatment referral recommendations. An instrument is needed that is accurate in identifying children who need treatment and are at risk of long-term oral health problems.</p>
<p>Item response theory (IRT) is useful in identifying a parsimonious set of survey items with acceptable psychometric properties [<xref ref-type="bibr" rid="pone.0299947.ref010">10</xref>–<xref ref-type="bibr" rid="pone.0299947.ref013">13</xref>]. It has been widely used in education assessments [<xref ref-type="bibr" rid="pone.0299947.ref014">14</xref>], psychological tests [<xref ref-type="bibr" rid="pone.0299947.ref015">15</xref>], and health outcome measurements [<xref ref-type="bibr" rid="pone.0299947.ref016">16</xref>]. IRT models maximize the likelihood of the individual response pattern to estimate the item characteristics and the individual’s latent trait. Such item- and individual-level information is crucial to understanding the survey performance and developing well-calibrated short forms. These item characteristic estimations also benefit further survey refinement, regardless of the number of item responses [<xref ref-type="bibr" rid="pone.0299947.ref017">17</xref>–<xref ref-type="bibr" rid="pone.0299947.ref019">19</xref>].</p>
<p>Machine Learning, on the other hand, is a data-centric approach to develop predictive and computationally efficient models. It has been used in dental research for disease identification [<xref ref-type="bibr" rid="pone.0299947.ref020">20</xref>, <xref ref-type="bibr" rid="pone.0299947.ref021">21</xref>], image diagnosis [<xref ref-type="bibr" rid="pone.0299947.ref022">22</xref>], dental care and dental surgery needs [<xref ref-type="bibr" rid="pone.0299947.ref023">23</xref>]. A collection of classical Machine Learning algorithms have demonstrated value for classification and prediction. Similar to a regression model, other Machine Learning algorithms classify or predict outcomes based on predictors. These algorithms are designed under various principles or mechanisms, including tree-based methods (like CatBoost [<xref ref-type="bibr" rid="pone.0299947.ref024">24</xref>] and Random Forest [<xref ref-type="bibr" rid="pone.0299947.ref025">25</xref>]), probability-based methods (like Logistic Regression and Naïve Bayes), distance-based methods (like K-Nearest Neighbor [<xref ref-type="bibr" rid="pone.0299947.ref025">25</xref>] and Support Vector Machine [<xref ref-type="bibr" rid="pone.0299947.ref026">26</xref>]) and more complex Neural Networks [<xref ref-type="bibr" rid="pone.0299947.ref027">27</xref>]. Machine learning has also been used to select optimal subsets of survey items [<xref ref-type="bibr" rid="pone.0299947.ref028">28</xref>–<xref ref-type="bibr" rid="pone.0299947.ref031">31</xref>]. However, such selection approaches can introduce selection bias and lead to overfitting issues because the selection is primarily limited to the targeted outcomes [<xref ref-type="bibr" rid="pone.0299947.ref011">11</xref>]. The best-performing subset identified by IRT is comparable to those selected using Machine Learning in terms of prediction power [<xref ref-type="bibr" rid="pone.0299947.ref011">11</xref>].</p>
<p>Prior work focused on the development of short forms associated with the Children’s Oral Health Status Index and referral recommendations based on Child Self-Reported Outcomes (CSROs) and Parent Proxy-Reported Outcomes (PPROs) using IRT [<xref ref-type="bibr" rid="pone.0299947.ref032">32</xref>, <xref ref-type="bibr" rid="pone.0299947.ref033">33</xref>]. In addition, demographic information has been used in addition to short-form items to improve predictive performance using XGBoost and Naïve Bayes [<xref ref-type="bibr" rid="pone.0299947.ref028">28</xref>]. Dental caries among children has also been predicted using a Multivariate Adaptive Regression Spline [<xref ref-type="bibr" rid="pone.0299947.ref034">34</xref>]. None of this prior work used machine learning and IRT in combination to identify the best set of survey items.</p>
<p>Our work aims to fully utilize and synergize the strengths of IRT and Machine Learning to develop well-calibrated and efficient survey instruments for screening active caries and urgent treatment needs in school-age populations. Parsimonious instruments can be distributed by schools to facilitate routine oral health screenings for a quick evaluation of dental caries and treatment needs. Public health agencies and dental programs can use these short forms to monitor children’s oral health conditions and identify those at high risk regularly.</p>
</sec>
<sec id="sec006" sec-type="materials|methods">
<title>2. Methods</title>
<sec id="sec007">
<title>2.1. Source of data and participants</title>
<p>Our sample consisted of 497 dyads of children ages 8 to 17 and their parents. Families were recruited from 14 dental clinics and private practices across Los Angeles County in a cross-sectional study from August 2015 to October 2019. The participating sites provided dental care to children from low-to-high-income communities with a broad ethnic-racial diversity. The sample size was determined by using the standard error around a correlation which was approximately 0.045 [<xref ref-type="bibr" rid="pone.0299947.ref035">35</xref>] and was about sufficient for estimating the item response theory models [<xref ref-type="bibr" rid="pone.0299947.ref019">19</xref>].</p>
<p>The study excluded children who were in orthodontic treatment to avoid complexities and bias in performing tooth-based exam assessments. Only one child and parent per family were included. No specific treatments were administered during the study by the research team. However, children identified with additional dental care needs were referred to the clinics for evaluation and follow-up.</p>
<p>Institutional review board approval (#13–00130) was obtained from the Office of Human Research Protection Program, University of California, Los Angeles. Children and their parents signed written assent/consent forms before participating in the study.</p>
</sec>
<sec id="sec008">
<title>2.2. Outcomes</title>
<p>All children received a dental examination to evaluate their clinical oral health status. Two experienced faculty dentists from UCLA Dental School performed the examinations following a Children’s Oral Health Protocol consisting of examinations on the overall occlusal condition and teeth status. Each primary and/or permanent tooth was recorded as being sound, decayed, missing, filled, bleeding, and with sealant.</p>
<p>The examiners conducted duplicated examinations on three students at each participating site. A total of 52 children were examined by both examiners on the same visit date to check the inter-rater reliability. The agreement was high using both Prevalence-Adjusted and Bias-Adjusted Kappa (0.77 for active caries and 0.8 for urgent treatment need) and Gwet’s AC1 (0.86 for active caries and 0.81 for urgent treatment need) [<xref ref-type="bibr" rid="pone.0299947.ref036">36</xref>, <xref ref-type="bibr" rid="pone.0299947.ref037">37</xref>].</p>
<p>The clinical measures serve as the gold standard for calibration and evaluation of the oral health survey items. We focus on two dichotomous outcomes: whether the child 1) had at least one tooth with active caries (AC &gt; 0) and 2) was in need of a dental referral and service (RFUTN). RFUTN was assigned using modified guidance from the National Health and Nutrition Examination Survey to focus on the severity of untreated decay, gingival bleeding (more than twelve teeth), and missing teeth due to caries [<xref ref-type="bibr" rid="pone.0299947.ref038">38</xref>].</p>
</sec>
<sec id="sec009">
<title>2.3. Predictors</title>
<p>Before the clinical examinations of children, both children and their parents independently completed a self-administered computer-assisted survey about children’s oral health. The survey instrument was administered using the Questionnaire Development System, QDS<sup>™</sup>, (Nova Research Company, Bethesda, MD, USA) at the study clinics. Participants were required to answer all survey questions, resulting in complete data for this study with no missing responses.</p>
<p>Oral health survey items encompassed physical, mental, and social components based on a conceptual framework that reflected the complex nature of oral health [<xref ref-type="bibr" rid="pone.0299947.ref032">32</xref>, <xref ref-type="bibr" rid="pone.0299947.ref033">33</xref>]. The survey assessed multiple aspects of children’s previous and current oral health status and behaviors such as overall oral health rating, teeth conditions, pain status, aesthetic, function limitations, experience recall (e.g., for the past 12 months, 4 weeks, 7 days, and 3 days), dental support, and so on (see <xref ref-type="supplementary-material" rid="pone.0299947.s001">S1 Data</xref> for the full list of items). Eighty-eight items for children and sixty-four items for parents were used for the analyses reported here. Demographic information was obtained using six child-reported and nine parent-reported items. The survey development process including focus groups, cognitive interviews, and full-item banks is discussed elsewhere [<xref ref-type="bibr" rid="pone.0299947.ref032">32</xref>, <xref ref-type="bibr" rid="pone.0299947.ref035">35</xref>, <xref ref-type="bibr" rid="pone.0299947.ref039">39</xref>]. In this paper, CSROs refers to Child Self-Reported Outcomes and PPROs refers to Parent Proxy-Reported Outcomes for better model labeling and comparison.</p>
</sec>
<sec id="sec010">
<title>2.4. Statistical analysis methods</title>
<sec id="sec011">
<title>2.4.1. Data preparation</title>
<p>CSRO and PPRO items associated with children’s oral health were rescaled into 0 to 5 with a higher score indicating worse oral health status, reflecting a higher likelihood of having a tooth with active caries and needing urgent dental care. If three or fewer responses were obtained for a response option, we collapsed this category with the adjacent higher-level option which represented a poorer oral health status. The full set of options was administered, but the collapsed options were used to estimate risk scores and make predictions. Highly right-skewed (positive skewness) items, as evidence of poor fit between the health status of the sample and the level of health measured by an item, were excluded [<xref ref-type="bibr" rid="pone.0299947.ref040">40</xref>]. Items that were positively and significantly associated (p-value &lt; = 0.05 and r &gt; = 0) or had at least a polychoric correlation &gt; = 0.20 with the two clinical outcomes, the presence of active caries and urgent treatment needs, were further investigated to develop short forms.</p>
</sec>
<sec id="sec012">
<title>2.4.2. IRT assumptions</title>
<p>We first developed short forms using Samejima’s graded response model that estimates item thresholds and slope parameters for each ordered survey response item [<xref ref-type="bibr" rid="pone.0299947.ref041">41</xref>]. The item thresholds represent the trait level necessary to respond above threshold with a 50% chance of selecting a particular response option or a higher response option. A slope parameter represents the capability of this item to discriminate between contiguous latent trait levels. Before implementing the model, we evaluated the assumptions of “sufficient” unidimensionality, local independence, and monotonicity.</p>
<p>Unidimensionality indicates that the response to an item is accounted for by one dominant latent trait. It can be assessed by single-factor confirmatory factor analysis (CFA) [<xref ref-type="bibr" rid="pone.0299947.ref042">42</xref>] by checking the comparative fit index (CFI &gt; 0.95), Tucker-Lewis Index (TLI &gt; 0.90), and the Root Mean Square Error of Approximation (RMSEA &lt; 0.06) [<xref ref-type="bibr" rid="pone.0299947.ref043">43</xref>, <xref ref-type="bibr" rid="pone.0299947.ref044">44</xref>]. CFA was conducted using an R package <italic>Lavaan</italic> [<xref ref-type="bibr" rid="pone.0299947.ref045">45</xref>] with polychoric correlations and the Mean- and Variance- Adjusted Weighted Least Square (WLSMV) robust estimations [<xref ref-type="bibr" rid="pone.0299947.ref045">45</xref>]. WLSMV estimations are more appropriate than maximum likelihood estimations for binary and ordinal variables [<xref ref-type="bibr" rid="pone.0299947.ref046">46</xref>, <xref ref-type="bibr" rid="pone.0299947.ref047">47</xref>].</p>
<p>Local independence requires that the item responses are mutually independent when controlling for the underlying latent variable. For any pair of items with a residual correlation absolute value of 0.20 or higher in the single-factor CFA, the item with higher accumulated residual correlations was eliminated [<xref ref-type="bibr" rid="pone.0299947.ref040">40</xref>].</p>
<p>The monotonicity was evaluated by item characteristic curves to ensure the probability of endorsing a more severe response option should increase monotonically with the latent trait scores, such as the likelihood of active caries and RFUTN in this study.</p>
</sec>
<sec id="sec013">
<title>2.4.3. IRT calibration and differential item functioning analysis</title>
<p>IRT models were estimated using Mplus 8.3 [<xref ref-type="bibr" rid="pone.0299947.ref048">48</xref>] to obtain item thresholds and slopes and for maximum likelihood estimations of each child’s location on the underlying score continuum. The thresholds, or item difficulty, refer to the point on the latent trait scale at which there is a 50% chance of responding at or above a certain response level for each item; while the slope, or item discrimination, measures the ability of an item to differentiate between children with varying levels of oral health conditions.</p>
<p>Differential Item Functioning (DIF) was assessed for each item using ordinal logistic regression on estimated person scores for demographic subgroups (age group, gender, and parents’ education levels). All p-values are 2-sided with a significance level of 0.05. Multiple comparisons for DIF were assessed using Benjamini and Hochberg (BH) adjusted p-value to control for the false discovery rate [<xref ref-type="bibr" rid="pone.0299947.ref049">49</xref>, <xref ref-type="bibr" rid="pone.0299947.ref050">50</xref>]. Ten-item short forms were selected with higher slope estimations, wider threshold parameters, and fewer DIF problems.</p>
</sec>
<sec id="sec014">
<title>2.4.4. Classification algorithms</title>
<p>The short-form and demographic items were combined to improve performance. All nominal variables were one-hot encoded with one dummy variable for each category. A collection of seven Statistical or Machine Learning algorithms was compared: CatBoost [<xref ref-type="bibr" rid="pone.0299947.ref024">24</xref>], Logistic Regression, K-Nearest Neighbors (KNN), Naïve Bayes, single-hidden-layer Neural Network [<xref ref-type="bibr" rid="pone.0299947.ref027">27</xref>], Random Forest [<xref ref-type="bibr" rid="pone.0299947.ref025">25</xref>], and Support Vector Machine (SVM) with Radial Kernels [<xref ref-type="bibr" rid="pone.0299947.ref026">26</xref>]. As there is no universal best algorithm for all data, each of these methods has its unique strengths in classification. The technical details of these classification algorithms are listed in the <xref ref-type="supplementary-material" rid="pone.0299947.s004">S1 Appendix</xref>.</p>
<p>To standardize the data for all algorithms, we performed the pre-process based on the training data first and the corresponding test set was projected onto the space of training data to test the developed models. We used the BoxCox transformation for continuous variables. All predictors were normalized to make the scale comparable using centering and scaling. The guideline of the transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD) checklist [<xref ref-type="bibr" rid="pone.0299947.ref051">51</xref>] was followed as outlined in the <xref ref-type="supplementary-material" rid="pone.0299947.s005">S2 Appendix</xref>.</p>
<p>All algorithms, except for Logistic Regression, had a broad selection of hyperparameters that could influence the prediction performance (See <xref ref-type="supplementary-material" rid="pone.0299947.s004">S1 Appendix</xref>). Cross-validation (CV) helps to fine-tune hyperparameters using a metric. The Receiver Operating Characteristic (ROC) curve plots the true positive rate (sensitivity) and the false positive rate (1 –specificity) given various classification thresholds. The Area under the ROC (AUC) could measure the model performance on each cross-validation testing set.</p>
<p>To validate the performance efficiently on limited data and prevent overfitting, we repeated 5-fold Nested Cross-Validation (nCV) five times, as shown in <xref ref-type="fig" rid="pone.0299947.g001">Fig 1</xref>. Each iteration within the inner loop utilized a fold for model validation and the rest for training. The models best-tuned by maximizing cross-validated AUC (CV-AUC) were evaluated on the corresponding testing set in the outer loop and CV-AUCs were aggregated.</p>
<fig id="pone.0299947.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0299947.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Repeated 5-fold nested cross-validation.</title>
<p>(*: Median on performance metrics such as CV-AUCs, Sensitivity and Specificity on training-validation and testing sets).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.g001" xlink:type="simple"/>
</fig>
<p>Compared with the CV, nCV reduces bias of error estimation for the general performance, especially for sample sizes less than 1000 [<xref ref-type="bibr" rid="pone.0299947.ref052">52</xref>, <xref ref-type="bibr" rid="pone.0299947.ref053">53</xref>]. The inner loop is responsible for tuning the hyperparameters, while the outer loop estimates the generalization accuracy. Means and standard errors of testing CV-AUC medians across five repetitions were used to select the best algorithm for each short form. Cutoff points for classification were chosen to maximize the sum of sensitivity and specificity and ensure sensitivity greater than 0.85 on training data. Summary statistics of accuracy performance metrics were calculated, including sensitivity, specificity, precision, and F1 score, on both training-validation and testing sets.</p>
<p>Machine learning algorithms often face a common challenge of class imbalance, as most learning algorithms are initially designed for balanced data. The training subsets within inner-loop cross-validation could be resampled using Synthetic Minority Over-Sampling Technique (SMOTE) [<xref ref-type="bibr" rid="pone.0299947.ref054">54</xref>], which has been shown to perform better on imbalanced classification compared to other resampling methods [<xref ref-type="bibr" rid="pone.0299947.ref055">55</xref>]. In SMOTE, the majority class is randomly under-sampled by removing data; while the minority class is over-sampled by creating "synthetic" examples based on its K-nearest Neighbors instead of bootstrapping with replacement. The best algorithm for each short form was selected from 14 algorithms in the combinations of one of seven statistical or Machine Learning algorithms with and without SMOTE. The algorithms were implemented using <italic>caret</italic> and <italic>DMwR</italic> packages in R 3.6.3 [<xref ref-type="bibr" rid="pone.0299947.ref056">56</xref>–<xref ref-type="bibr" rid="pone.0299947.ref058">58</xref>].</p>
</sec>
<sec id="sec015">
<title>2.4.5. Model summary</title>
<p>The short-form development initiated with CSRO and PPRO items on children’s oral health and yielded four separate item pools to develop short forms related to 1) <bold>AC-CSRO:</bold> child self-reported active caries, 2) <bold>RFUTN-CSRO:</bold> child self-reported urgent treatment needs, 3) <bold>AC-PPRO:</bold> parents’ perception of their children having active caries, and 4) <bold>RFUTN-PPRO:</bold> parents’ perception of their children needing a referral for urgent treatment. We identified short-form items using IRT. Items that were verified by assumption checks were calibrated with estimations of slopes and thresholds, DIFs, and ability scores recorded.</p>
<p>The four short forms with demographic information were further enhanced using seven algorithms with and without SMOTE for better prediction accuracy. The refined short forms are 1) <bold>AC-DEMO-CSRO</bold>: AC-CSRO short-form items with children-reported demographic information; 2) <bold>AC-DEMO-PPRO</bold>: AC-PPRO short-form with parent-reported demographic information; 3) <bold>AC-DEMO-CSRO-PPRO</bold>: AC-CSRO and AC-PPRO short-form items with all available demographic information; and another three for RFUTN as 4) <bold>RFUTN-DEMO-CSRO</bold>; 5) <bold>RFUTN-DEMO-PPRO</bold>; 6) <bold>RFUTN-DEMO-CSRO-PPRO</bold>. Using the repeated nested cross-validation method, we selected the best algorithm with the maximized mean of the testing CV-AUC medians for each of the refined short forms.</p>
<p>R and Mplus code for IRT assumption validation, short form calibration, machine learning model fitting, and generating tables and figures are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/dixiong777/COH_SF_IRTML" xlink:type="simple">https://github.com/dixiong777/COH_SF_IRTML</ext-link>.</p>
</sec>
</sec>
</sec>
<sec id="sec016" sec-type="results">
<title>3. Results</title>
<sec id="sec017">
<title>3.1. Participants</title>
<p>The sample included 497 dyads of children aged 8–17 years old and their parents with characteristics detailed in <xref ref-type="table" rid="pone.0299947.t001">Table 1</xref>. This cross-sectional study design and on-site computer-assisted survey ensured a complete data set without any missing survey responses or clinical exam results. Approximately one-quarter (24.3%) of the children had at least one tooth with untreated decay. The RFUTN cases were the 42.3% of children who were identified as needing to see a dentist within the next 2 weeks (22.3%) or immediately (19.9%).</p>
<table-wrap id="pone.0299947.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0299947.t001</object-id>
<label>Table 1</label> <caption><title>Characteristics of children and parents (N = 497).</title></caption>
<alternatives>
<graphic id="pone.0299947.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.t001" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="left">Variables</th>
<th align="center">Mean (SD) or No. (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center" rowspan="8"><bold>Clinical Outcomes</bold></td>
<td align="left">Active Caries</td>
<td align="left"/>
</tr>
<tr>
<td align="left"> No (AC = 0)</td>
<td align="center">376 (76%)</td>
</tr>
<tr>
<td align="left"> Yes (AC &gt; 0)</td>
<td align="center">121 (24%)</td>
</tr>
<tr>
<td align="left">Referral Recommendation</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Continue your routine care</td>
<td align="center">222 (45%)</td>
</tr>
<tr>
<td align="left"> See a dentist at your earliest convenience</td>
<td align="center">65 (13%)</td>
</tr>
<tr>
<td align="left"> See a dentist within the next 2 weeks</td>
<td align="center">111 (22%)</td>
</tr>
<tr>
<td align="left"> See a dentist immediately</td>
<td align="center">99 (20%)</td>
</tr>
<tr>
<td align="center" rowspan="22"><bold>Child-reported Characteristics</bold></td>
<td align="left">Children’s age, Mean (SD)</td>
<td align="center">12 (2.9)</td>
</tr>
<tr>
<td align="left">Children age group<xref ref-type="table-fn" rid="t001fn001"><sup>1</sup></xref></td>
<td align="left"/>
</tr>
<tr>
<td align="left"> 8–12</td>
<td align="center">290 (58%)</td>
</tr>
<tr>
<td align="left"> 13–17</td>
<td align="center">207 (42%)</td>
</tr>
<tr>
<td align="left">Children’s gender</td>
<td align="left"/>
</tr>
<tr>
<td align="left"> Male</td>
<td align="center">255 (51%)</td>
</tr>
<tr>
<td align="left"> Female</td>
<td align="center">241 (49%)</td>
</tr>
<tr>
<td align="left"> Female to male transgender</td>
<td align="center">1 (0%)</td>
</tr>
<tr>
<td align="left">Children’s race and ethnicity</td>
<td align="left"/>
</tr>
<tr>
<td align="left"> Caucasian/ White</td>
<td align="center">87 (18%)</td>
</tr>
<tr>
<td align="left"> Black/ African American</td>
<td align="center">43 (9%)</td>
</tr>
<tr>
<td align="left"> Hispanic/ Latino</td>
<td align="center">227 (46%)</td>
</tr>
<tr>
<td align="left"> Asian</td>
<td align="center">54 (11%)</td>
</tr>
<tr>
<td align="left"> Other</td>
<td align="center">86 (17%)</td>
</tr>
<tr>
<td align="left">Children’s primary language</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> English</td>
<td align="center">429 (86%)</td>
</tr>
<tr>
<td align="left"> Other</td>
<td align="center">68 (14%)</td>
</tr>
<tr>
<td align="left">Number of children in the household</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> 1</td>
<td align="center">177 (36%)</td>
</tr>
<tr>
<td align="left"> 2</td>
<td align="center">165 (33%)</td>
</tr>
<tr>
<td align="left"> 3</td>
<td align="center">79 (16%)</td>
</tr>
<tr>
<td align="left"> &gt; = 4</td>
<td align="center">76 (15%)</td>
</tr>
<tr>
<td align="center" rowspan="34"><bold>Parent-reported Characteristics</bold></td>
<td align="left">Parent’s age, Mean (SD)</td>
<td align="center">42.1 (8.8)</td>
</tr>
<tr>
<td align="left">Parent age group<xref ref-type="table-fn" rid="t001fn001"><sup>1</sup></xref></td>
<td align="center"/>
</tr>
<tr>
<td align="left"> &lt;30</td>
<td align="center">40 (8%)</td>
</tr>
<tr>
<td align="left"> 30–44</td>
<td align="center">262 (53%)</td>
</tr>
<tr>
<td align="left"> 45–59</td>
<td align="center">179 (36%)</td>
</tr>
<tr>
<td align="left">  &gt; = 60</td>
<td align="center">16 (3%)</td>
</tr>
<tr>
<td align="left">Parent’s gender</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Male</td>
<td align="center">131 (26%)</td>
</tr>
<tr>
<td align="left"> Female</td>
<td align="center">366 (74%)</td>
</tr>
<tr>
<td align="left">Children’s race and ethnicity</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Caucasian/ White</td>
<td align="center">78 (16%)</td>
</tr>
<tr>
<td align="left"> Black/ African American</td>
<td align="center">42 (9%)</td>
</tr>
<tr>
<td align="left"> Hispanic/ Latino</td>
<td align="center">242 (49%)</td>
</tr>
<tr>
<td align="left"> Asian</td>
<td align="center">46 (9%)</td>
</tr>
<tr>
<td align="left"> Other</td>
<td align="center">89 (18%)</td>
</tr>
<tr>
<td align="left">Parent’s race and ethnicity</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Caucasian/ White</td>
<td align="center">103 (21%)</td>
</tr>
<tr>
<td align="left"> Black/ African American</td>
<td align="center">42 (9%)</td>
</tr>
<tr>
<td align="left"> Hispanic/ Latino</td>
<td align="center">258 (52%)</td>
</tr>
<tr>
<td align="left"> Asian</td>
<td align="center">56 (11%)</td>
</tr>
<tr>
<td align="left"> Other</td>
<td align="center">38 (8%)</td>
</tr>
<tr>
<td align="left">Parent’s primary language</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> English</td>
<td align="center">318 (64%)</td>
</tr>
<tr>
<td align="left"> Other</td>
<td align="center">179 (36%)</td>
</tr>
<tr>
<td align="left">Child has dental insurance</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> No</td>
<td align="center">104 (21%)</td>
</tr>
<tr>
<td align="left"> Yes</td>
<td align="center">393 (79%)</td>
</tr>
<tr>
<td align="left">Parental employment status</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Full-time job</td>
<td align="center">382 (77%)</td>
</tr>
<tr>
<td align="left"> Part-time job</td>
<td align="center">54 (11%)</td>
</tr>
<tr>
<td align="left"> Not working</td>
<td align="center">61 (12%)</td>
</tr>
<tr>
<td align="left">Parent’s Marriage Status</td>
<td align="center"/>
</tr>
<tr>
<td align="left"> Married/ Living with Partner</td>
<td align="center">370 (74%)</td>
</tr>
<tr>
<td align="left"> Single</td>
<td align="center">127 (26%)</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t001fn001"><p><sup>1</sup>Characteristics not used for the prediction models.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec018">
<title>3.2. Model Development and specification</title>
<sec id="sec019">
<title>3.2.1. Data Preparation and IRT assumptions</title>
<p>After we checked the correlation with the target outcomes, we selected the screening item pools for <bold>AC-CSRO</bold> (17 items), <bold>RFUTN-CSRO</bold> (27 items), <bold>AC-PPRO</bold> (27 items), and <bold>RFUTN-PPRO</bold> (19 items). Two highly skewed items (skewness = 9.79, “tobacco use” for <bold>RFUTN-CSRO,</bold> and “hospital emergency needs in the last 12 months” for both <bold>AC-PPRO</bold> and <bold>RFUTN-PPRO</bold>) were further excluded.</p>
<p>Single-factor CFAs were estimated for the remaining 17 items for <bold>AC-CSRO</bold>, 26 items for <bold>RFUTN-CSRO</bold>, 26 items for <bold>AC-PPRO,</bold> and 18 items for <bold>RFUTN-PPRO</bold> at first. The initial fit indices for all four models were: <bold>AC-CSRO</bold> (CFI = 0.927, TLI = 0.916, RMSEA = 0.061), <bold>RFUTN-CSRO</bold> (CFI = 0.924, TLI = 0.918, RMSEA = 0.051), <bold>AC-PPRO</bold> (CFI = 0.852, TLI = 0.839, RMSEA = 0.070), and <bold>RFUTN-PPRO</bold> (CFI = 0.894, TLI = 0.880, RMSEA = 0.065).</p>
<p>For each pair of correlated items, items with higher accumulative correlations were considered as being locally dependent including three items for <bold>AC-CSRO</bold>, seven items for <bold>RFUTN-CSRO</bold>, five items for <bold>AC-PPRO,</bold> and nine items for <bold>RFUTN-PPRO</bold>. For example, for <bold>RFUTN-CSRO</bold>, “peer jokes on how teeth look” was eliminated due to high residual correlations with five items (“miss school days”, “being afraid to see a dentist”, “brush teeth” “cognition of flossing teeth”, “parents as important people to oral health”, “medical providers as important people to oral health”).</p>
<p>With these local-dependent items removed, the final fit indices improved and produced adequate fit for all four models: <bold>AC-CSRO</bold> (12 items, CFI = 0.992, TLI = 0.990, RMSEA = 0.029), <bold>RFUTN-CSRO</bold> (19 items, CFI = 0.970, TLI = 0.966, RMSEA = 0.045), <bold>AC-PPRO</bold> (17 items, CFI = 0.952, TLI = 0.944, RMSEA = 0.057), and <bold>RFUTN-PPRO</bold> (15 items, CFI = 0.981, TLI = 0.978, RMSEA = 0.039). More details on the assumption checking are in <xref ref-type="supplementary-material" rid="pone.0299947.s001">S1 Data</xref>.</p>
</sec>
<sec id="sec020">
<title>3.2.2. IRT calibration and DIF analysis</title>
<p>The remaining items were calibrated to estimate item threshold and slope parameters (See more details in <xref ref-type="supplementary-material" rid="pone.0299947.s002">S2 Data</xref>). Ten-item short forms were selected with higher slope estimations, wider threshold parameters, and fewer flags for DIFs from the corresponding long forms, as presented in <xref ref-type="table" rid="pone.0299947.t002">Table 2</xref>.</p>
<table-wrap id="pone.0299947.t002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0299947.t002</object-id>
<label>Table 2</label> <caption><title>Item calibration statistics.</title></caption>
<alternatives>
<graphic id="pone.0299947.t002g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.t002" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<tbody>
<tr>
<td align="left" colspan="7"><bold>a. 10-item AC-CSRO Short Form</bold></td>
</tr>
<tr>
<td align="center" rowspan="2"><bold>Items</bold></td>
<td align="center"><bold>Slope</bold> <xref ref-type="table-fn" rid="t002fn001"><sup>a</sup></xref></td>
<td align="center" colspan="5"><bold>Location Thresholds</bold></td>
</tr>
<tr>
<td align="center"/>
<td align="center">1</td>
<td align="center">2</td>
<td align="center">3</td>
<td align="center">4</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">It was hard for me to have fun because of the pain in my mouth.</td>
<td align="center">4.34</td>
<td align="center">5.92</td>
<td align="center">7.79</td>
<td align="center">9.95</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to pay attention because of the pain in my mouth.</td>
<td align="center">4.17</td>
<td align="center">5.01</td>
<td align="center">7.03</td>
<td align="center">9.93</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">I felt stressed because of the pain in my mouth.</td>
<td align="center">3.86</td>
<td align="center">4.94</td>
<td align="center">6.60</td>
<td align="center">9.05</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to talk because of the pain in my mouth.</td>
<td align="center">2.86</td>
<td align="center">4.05</td>
<td align="center">5.94</td>
<td align="center">7.36</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to eat because of the pain in my mouth.</td>
<td align="center">2.51</td>
<td align="center">2.21</td>
<td align="center">4.04</td>
<td align="center">5.65</td>
<td align="center">6.47</td>
<td align="center"/>
</tr>
<tr>
<td align="left">In the last 4 weeks, how much of the time did you have pain or discomfort?</td>
<td align="center">1.50</td>
<td align="center">0.86</td>
<td align="center">2.17</td>
<td align="center">3.81</td>
<td align="center">4.66</td>
<td align="center"/>
</tr>
<tr>
<td align="left">In the last 4 weeks, how much of the time were you able to swallow comfortably?</td>
<td align="center">0.75</td>
<td align="center">1.21</td>
<td align="center">1.71</td>
<td align="center">1.91</td>
<td align="center">2.29</td>
<td align="center">2.53</td>
</tr>
<tr>
<td align="left">Did any of the following reasons ever keep you from visiting a dentist? My parents didn’t have any money for a dentist.</td>
<td align="center">0.49</td>
<td align="center">2.71</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">How much are you afraid to go to a dentist?</td>
<td align="center">0.41</td>
<td align="center">0.33</td>
<td align="center">2.05</td>
<td align="center">3.06</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">How often do you brush your teeth?</td>
<td align="center">0.38</td>
<td align="center">0.50</td>
<td align="center">2.26</td>
<td align="center">2.95</td>
<td align="center">3.28</td>
<td align="center"/>
</tr>
<tr>
<td align="left" colspan="7"><bold>b. 10-item RFUTN-CSRO Short Form</bold></td>
</tr>
<tr>
<td align="center" rowspan="2"><bold>Items</bold></td>
<td align="center"><bold>Slope</bold> <xref ref-type="table-fn" rid="t002fn001"><sup>a</sup></xref></td>
<td align="center" colspan="5"><bold>Location Thresholds</bold></td>
</tr>
<tr>
<td align="center"/>
<td align="center">1</td>
<td align="center">2</td>
<td align="center">3</td>
<td align="center">4</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">I felt stressed because of the pain in my mouth.</td>
<td align="center">4.58</td>
<td align="center">5.74</td>
<td align="center">7.52</td>
<td align="center">10.02</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to pay attention because of the pain in my mouth.</td>
<td align="center">4.29</td>
<td align="center">5.84</td>
<td align="center">7.56</td>
<td align="center">9.49</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to have fun because of the pain in my mouth.</td>
<td align="center">4.31</td>
<td align="center">5.17</td>
<td align="center">7.10</td>
<td align="center">9.79</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to sleep because of the pain in my mouth.</td>
<td align="center">3.38</td>
<td align="center">4.69</td>
<td align="center">6.32</td>
<td align="center">8.28</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to eat because of the pain in my mouth.</td>
<td align="center">2.85</td>
<td align="center">2.45</td>
<td align="center">4.38</td>
<td align="center">6.03</td>
<td align="center">6.85</td>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for me to talk because of the pain in my mouth.</td>
<td align="center">3.03</td>
<td align="center">4.22</td>
<td align="center">6.08</td>
<td align="center">7.44</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It hurts my teeth to chew.</td>
<td align="center">2.06</td>
<td align="center">2.14</td>
<td align="center">3.82</td>
<td align="center">6.06</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">I had a tooth that hurts.</td>
<td align="center">1.91</td>
<td align="center">1.44</td>
<td align="center">2.75</td>
<td align="center">4.62</td>
<td align="center">5.86</td>
<td align="center"/>
</tr>
<tr>
<td align="left">My mouth hurts.</td>
<td align="center">1.95</td>
<td align="center">1.32</td>
<td align="center">3.30</td>
<td align="center">5.74</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">During the last school year, how many days of school did you miss because of pain in the mouth, tongue, teeth, jaws, or gums?</td>
<td align="center">1.20</td>
<td align="center">3.31</td>
<td align="center">4.24</td>
<td align="center">1.20</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left" colspan="7"><bold>c. 10-item AC-PPRO Short Form</bold></td>
</tr>
<tr>
<td align="center" rowspan="2"><bold>Items</bold></td>
<td align="center"><bold>Slope</bold> <xref ref-type="table-fn" rid="t002fn001"><sup>a</sup></xref></td>
<td align="center" colspan="5"><bold>Location Thresholds</bold></td>
</tr>
<tr>
<td align="center"/>
<td align="center">1</td>
<td align="center">2</td>
<td align="center">3</td>
<td align="center">4</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">It was hard for my child to eat because of the pain in his/her mouth.</td>
<td align="center">4.36</td>
<td align="center">4.73</td>
<td align="center">7.30</td>
<td align="center">9.76</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It hurts my child’s teeth to chew.</td>
<td align="center">3.69</td>
<td align="center">3.92</td>
<td align="center">6.26</td>
<td align="center">8.60</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">It was hard for my child to talk because of the pain in his/her mouth.</td>
<td align="center">3.63</td>
<td align="center">5.70</td>
<td align="center">7.67</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child’s mouth hurts.</td>
<td align="center">2.93</td>
<td align="center">2.60</td>
<td align="center">5.16</td>
<td align="center">7.69</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child’s gums hurt.</td>
<td align="center">2.92</td>
<td align="center">3.47</td>
<td align="center">5.26</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child had a tooth that hurts.</td>
<td align="center">2.78</td>
<td align="center">2.41</td>
<td align="center">4.10</td>
<td align="center">7.037</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child’s jaw hurts.</td>
<td align="center">2.59</td>
<td align="center">3.88</td>
<td align="center">5.57</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">During the last school year, how many days of school did your child miss because of pain in his/her mouth, tongue, teeth, or gums?</td>
<td align="center">1.30</td>
<td align="center">3.57</td>
<td align="center">4.33</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">During the last 12 months, did your child have an oral health problem?</td>
<td align="center">0.93</td>
<td align="center">1.23</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">In the last 4 weeks, how much of the time were you pleased or happy with the look of your child’s mouth, teeth, jaws, or gums?</td>
<td align="center">0.54</td>
<td align="center">-0.66</td>
<td align="center">0.86</td>
<td align="center">1.53</td>
<td align="center">2.82</td>
<td align="center">3.38</td>
</tr>
<tr>
<td align="left" colspan="7"><bold>d. 10-item RFUTN-PPRO Short Form</bold></td>
</tr>
<tr>
<td align="center" rowspan="2"><bold>Items</bold></td>
<td align="center"><bold>Slope</bold> <xref ref-type="table-fn" rid="t002fn001"><sup>a</sup></xref></td>
<td align="center" colspan="5"><bold>Location Thresholds</bold></td>
</tr>
<tr>
<td align="center"/>
<td align="center">1</td>
<td align="center">2</td>
<td align="center">3</td>
<td align="center">4</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">It was hard for my child to eat because of the pain in his/her mouth.</td>
<td align="center">3.90</td>
<td align="center">4.14</td>
<td align="center">6.64</td>
<td align="center">9.13</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child had a tooth that hurts.</td>
<td align="center">3.24</td>
<td align="center">2.63</td>
<td align="center">4.54</td>
<td align="center">7.95</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child’s gums hurt.</td>
<td align="center">2.59</td>
<td align="center">2.32</td>
<td align="center">4.71</td>
<td align="center">7.21</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">My child’s mouth hurts.</td>
<td align="center">2.60</td>
<td align="center">3.10</td>
<td align="center">4.82</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">During the last school year, how many days of school did your child miss because of pain in his/her mouth, tongue, teeth, or gums?</td>
<td align="center">1.29</td>
<td align="center">3.56</td>
<td align="center">4.32</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">During the past 12 months, was there a time that your child needed dental care but did not get it?</td>
<td align="center">1.01</td>
<td align="center">2.85</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">In the last 4 weeks, how much of the time were you pleased or happy with the look of your child’s mouth, teeth, jaws, or gums?</td>
<td align="center">0.70</td>
<td align="center">-0.68</td>
<td align="center">0.90</td>
<td align="center">1.59</td>
<td align="center">2.91</td>
<td align="center">3.47</td>
</tr>
<tr>
<td align="left">How much is your child afraid to go to a dentist?</td>
<td align="center">0.56</td>
<td align="center">0.40</td>
<td align="center">1.71</td>
<td align="center">3.15</td>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">Compared to other kids my child’s age:</td>
<td align="center">0.43</td>
<td align="center">-0.07</td>
<td align="center">3.19</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="left">How often do you remind your child to brush his/her teeth before he/she goes to sleep?</td>
<td align="center">0.28</td>
<td align="center">-3.01</td>
<td align="center">-1.93</td>
<td align="center">-0.88</td>
<td align="center">-0.47</td>
<td align="center">0.12</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t002fn001"><p><sup>a</sup>Items are ordered based on the size of their slopes.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Short form items encompass various aspects, covering physical, mental, and social domains. Items concerning enjoyment, attention, and stress difficulties due to the pain had higher slopes and thresholds in CSRO short forms for both outcomes. This indicated that they were sensitive to distinguishing among children with poorer oral health. The AC-CSRO short form required more questions related to functioning challenges due to oral health issues, while the RFUTN-CSRO short form focuses on recent direct pain. Unlike these child short forms, in the parent short forms, the item about eating difficulty was more effective in identifying children at risk, with the highest slope and high location thresholds. These parent short forms included more long-term pain questions. Compared with the AC-PPRO short form, the RFUTN-PPRO short form contains items on oral healthcare access, children’s fear of dental visits, and brushing habits, which were also in the AC-CSRO short form for child responses.</p>
<p>The information curves for the short forms and their corresponding long forms are shown in <xref ref-type="supplementary-material" rid="pone.0299947.s003">S1 Fig</xref>.</p>
</sec>
<sec id="sec021">
<title>3.2.3. Classification</title>
<p>The calibrated short-form items were combined with demographic items listed in <xref ref-type="table" rid="pone.0299947.t001">Table 1</xref>. Our approach employed seven algorithms, each with and without SMOTE, through 5-fold nCV. The validations were repeated 5 times independently, resulting in 350 local fine-tuned best models using traditional 5-fold Cross-Validation (as 5 best-tuned models by 5-fold CV-AUC × 7 algorithms × 2 resampling options × 5 times) for each refined short-form. The prediction models were evaluated and compared, as detailed in <xref ref-type="table" rid="pone.0299947.t003">Table 3</xref>, to assess the classification performances of the short forms.</p>
<table-wrap id="pone.0299947.t003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0299947.t003</object-id>
<label>Table 3</label> <caption><title>Estimated means and standard errors of nCV-AUC median.</title></caption>
<alternatives>
<graphic id="pone.0299947.t003g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.t003" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center">Refined Short Form<xref ref-type="table-fn" rid="t003fn001"><sup>a</sup></xref></th>
<th align="center">Resampling</th>
<th align="center">CatBoost</th>
<th align="center">Logistic Regression</th>
<th align="center">K-Nearest Neighbors</th>
<th align="center">Naïve Bayes</th>
<th align="center">Neural Network</th>
<th align="center">Random Forest</th>
<th align="center">SVM with Radial Kernel</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center" rowspan="2">AC-DEMO-CSRO</td>
<td align="center">No</td>
<td align="center">0.61 (0.02)</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.61 (0.01)</td>
<td align="center"><bold>0.62 (0.00)</bold></td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.61 (0.01)</td>
<td align="center">0.60 (0.00)</td>
</tr>
<tr>
<td align="center">SMOTE</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.61 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.58 (0.01)</td>
</tr>
<tr>
<td align="center" rowspan="2">AC-DEMO-PPRO</td>
<td align="center">No</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.57 (0.02)</td>
<td align="center">0.58 (0.01)</td>
<td align="center"><bold>0.63 (0.00)</bold></td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.60 (0.02)</td>
<td align="center">0.59 (0.01)</td>
</tr>
<tr>
<td align="center">SMOTE</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.55 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.56 (0.01)</td>
</tr>
<tr>
<td align="center" rowspan="2" style="border-bottom-width:thick">AC-DEMO-CSRO-PPRO</td>
<td align="center">No</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.56 (0.00)</td>
<td align="center">0.58 (0.01)</td>
<td align="center"><bold>0.64 (0.01)</bold></td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.62 (0.01)</td>
<td align="center">0.60 (0.01)</td>
</tr>
<tr>
<td align="center" style="border-bottom-width:thick">SMOTE</td>
<td align="center" style="border-bottom-width:thick">0.58 (0.00)</td>
<td align="center" style="border-bottom-width:thick">0.55 (0.01)</td>
<td align="center" style="border-bottom-width:thick">0.59 (0.01)</td>
<td align="center" style="border-bottom-width:thick">0.56 (0.02)</td>
<td align="center" style="border-bottom-width:thick">0.57 (0.02)</td>
<td align="center" style="border-bottom-width:thick">0.58 (0.02)</td>
<td align="center" style="border-bottom-width:thick">0.56 (0.02)</td>
</tr>
<tr>
<td align="center" rowspan="2">RFUTN-DEMO-CSRO</td>
<td align="center">No</td>
<td align="center">0.58 (0.00)</td>
<td align="center">0.56 (0.01)</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.56 (0.01)</td>
<td align="center">0.60 (0.01)</td>
</tr>
<tr>
<td align="center">SMOTE</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.54 (0.01)</td>
<td align="center">0.57 (0.00)</td>
<td align="center"><bold>0.60 (0.01)</bold></td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.54 (0.01)</td>
<td align="center">0.59 (0.01)</td>
</tr>
<tr>
<td align="center" rowspan="2">RFUTN-DEMO-PPRO</td>
<td align="center">No</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.61 (0.00)</td>
<td align="center">0.59 (0.01)</td>
<td align="center"><bold>0.62 (0.00)</bold></td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.61 (0.01)</td>
</tr>
<tr>
<td align="center">SMOTE</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.61 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.57 (0.00)</td>
</tr>
<tr>
<td align="center" rowspan="2">RFUTN-DEMO-CSRO-PPRO</td>
<td align="center">No</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center"><bold>0.62 (0.01)</bold></td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.60 (0.01)</td>
<td align="center">0.61 (0.01)</td>
</tr>
<tr>
<td align="center">SMOTE</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.57 (0.01)</td>
<td align="center">0.61 (0.02)</td>
<td align="center">0.59 (0.01)</td>
<td align="center">0.58 (0.01)</td>
<td align="center">0.57 (0.01)</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t003fn001"><p><sup>a</sup> The best algorithm for each refined short form is in bold.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec id="sec022">
<title>3.3. Model performance</title>
<p>The Naïve Bayes algorithm without SMOTE outperformed other algorithms for all refined short forms with higher nCV-AUC medians, except one (<bold>RFUTN-DEMO-CSRO</bold>), for which the best model was still Naïve Bayes but with SMOTE. Their prediction performance, including sensitivity, specificity, precision, and F1 score, on training-validation and testing sets for each refined short form is presented in <xref ref-type="table" rid="pone.0299947.t004">Table 4</xref>. Models incorporating both self-reported and proxy-reported responses showed a slightly higher predictive accuracy than those relying on either child-reported or proxy-reported responses.</p>
<table-wrap id="pone.0299947.t004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0299947.t004</object-id>
<label>Table 4</label> <caption><title>Prediction performance on each refined short form based on the best algorithm.</title></caption>
<alternatives>
<graphic id="pone.0299947.t004g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.t004" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" rowspan="2">Refined Short Form</th>
<th align="center" colspan="4">Training-validation Set</th>
<th align="center" colspan="4">Testing Set</th>
</tr>
<tr>
<th align="center">Sensitivity</th>
<th align="center">Specificity</th>
<th align="center">Precision</th>
<th align="center">F1 Score</th>
<th align="center">Sensitivity</th>
<th align="center">Specificity</th>
<th align="center">Precision</th>
<th align="center">F1 Score</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">AC-DEMO-CSRO</td>
<td align="center">0.87 (0.01)</td>
<td align="center">0.33 (0.05)</td>
<td align="center">0.30 (0.01)</td>
<td align="center">0.45 (0.01)</td>
<td align="center">0.83 (0.02)</td>
<td align="center">0.29 (0.02)</td>
<td align="center">0.27 (0.00)</td>
<td align="center">0.42 (0.01)</td>
</tr>
<tr>
<td align="center">AC-DEMO-PPRO</td>
<td align="center">0.86 (0.01)</td>
<td align="center">0.36 (0.02)</td>
<td align="center">0.30 (0.01)</td>
<td align="center">0.45 (0.01)</td>
<td align="center">0.85 (0.06)</td>
<td align="center">0.31 (0.03)</td>
<td align="center">0.27 (0.01)</td>
<td align="center">0.42 (0.01)</td>
</tr>
<tr>
<td align="center" style="border-bottom-width:thick">AC-DEMO-CSRO-PPRO</td>
<td align="center" style="border-bottom-width:thick">0.87 (0.01)</td>
<td align="center" style="border-bottom-width:thick">0.35 (0.03)</td>
<td align="center" style="border-bottom-width:thick">0.31 (0.00)</td>
<td align="center" style="border-bottom-width:thick">0.45 (0.00)</td>
<td align="center" style="border-bottom-width:thick">0.84 (0.05)</td>
<td align="center" style="border-bottom-width:thick">0.30 (0.01)</td>
<td align="center" style="border-bottom-width:thick">0.27 (0.00)</td>
<td align="center" style="border-bottom-width:thick">0.42 (0.00)</td>
</tr>
<tr>
<td align="center">RFUTN-DEMO-CSRO</td>
<td align="center">0.86 (0.01)</td>
<td align="center">0.42 (0.04)</td>
<td align="center">0.46 (0.01)</td>
<td align="center">0.61 (0.01)</td>
<td align="center">0.77 (0.04)</td>
<td align="center">0.36 (0.04)</td>
<td align="center">0.44 (0.01)</td>
<td align="center">0.57 (0.02)</td>
</tr>
<tr>
<td align="center">RFUTN-DEMO-PPRO</td>
<td align="center">0.87 (0.02)</td>
<td align="center">0.24 (0.02)</td>
<td align="center">0.51 (0.01)</td>
<td align="center">0.64 (0.01)</td>
<td align="center">0.81 (0.03)</td>
<td align="center">0.18 (0.03)</td>
<td align="center">0.47 (0.00)</td>
<td align="center">0.59 (0.01)</td>
</tr>
<tr>
<td align="center">RFUTN-DEMO-CSRO-PPRO</td>
<td align="center">0.87 (0.03)</td>
<td align="center">0.39 (0.02)</td>
<td align="center">0.52 (0.01)</td>
<td align="center">0.65 (0.01)</td>
<td align="center">0.81 (0.06)</td>
<td align="center">0.31 (0.05)</td>
<td align="center">0.47 (0.01)</td>
<td align="center">0.59 (0.01)</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>Among 350 local fine-tuned CVs for each refined short form, models with the best testing performance were generated by different algorithms: KNN with SMOTE for <bold>AC-DEMO-PPRO</bold> (sensitivity = 0.84, specificity = 0.48), <bold>AC-DEMO-CSRO-PPRO</bold> (sensitivity = 0.83, specificity = 0.45), and <bold>RFUTN-DEMO-CSRO-PPRO</bold> (sensitivity = 0.83, specificity = 0.45); Radial Kernel SVM without SMOTE for <bold>AC-DEMO-CSRO</bold> (sensitivity = 0.83, specificity = 0.53) and <bold>RFUTN-DEMO-CSRO</bold> (sensitivity = 0.81, specificity = 0.53); and CatBoost without SMOTE for <bold>RFUTN-DEMO-PPRO</bold> (sensitivity = 0.83, specificity = 0.52).</p>
</sec>
</sec>
<sec id="sec023" sec-type="conclusions">
<title>4. Discussion</title>
<p>This study aims to integrate the capabilities of IRT and machine learning to build survey short forms and predictive instruments for active caries and urgent treatment needs screening in large school-age populations.</p>
<p>We developed ten-item short forms for active caries and referral for urgent treatment needs based on child self-reported and parent proxy-reported information separately using IRT. The slopes and thresholds were the key parameters used for selecting variables that were independent of outcomes. These short forms provide high discriminability and wide thresholds to cover children with various health conditions.</p>
<p>Short forms based on child reports only, parent reports only, and child and parent reports collectively classified children using multiple statistical and machine learning algorithms. The Naïve Bayes outperformed other algorithms in general. For refined short forms using all CSRO and PPRO items, the average testing sensitivity and specificity were 0.84 and 0.30 for active caries, and 0.81 and 0.31 for RFUTN. The corresponding best testing sensitivities and specificities for local fine-tuned models were both 0.83 and 0.45 using KNN with SMOTE.</p>
<sec id="sec024">
<title>4.1. Study limitations</title>
<p>Although we included a diverse sample, it was a convenience sample drawn from children with a dental home, which does not represent the general school-age population. Moreover, the prediction performance of the short forms appears to be weak given the current samples. The classification accuracies increase with the increment of samples when the datasets have a good discriminative power between two classes [<xref ref-type="bibr" rid="pone.0299947.ref059">59</xref>]. Our survey questions about children’s oral health perceptions covered aspects of dental caries, missing teeth, and periodontal diseases, but they were not disease-specific. Parents and children responded to the surveys based on their perceptions of oral health, especially in the past three months or the last 12 months, which might affect concordance with oral exam results. In addition, some oral diseases are likely asymptomatic at an early disease stage and cannot be identified through self-reported survey questions.</p>
<p>To improve the survey protocol of oral health screening for school-age children, our ongoing work involves a more representative sample, more disease-specific survey questions, and the inclusion of various additional data sources.</p>
</sec>
<sec id="sec025">
<title>4.2. Interpretation</title>
<p>Self-reported enjoyment, attention and stress challenges due to pain were more effective in detecting children with active caries and urgent dental needs. It was more obvious to children that they had a dental cavity when the pain caused functioning issues, or that they needed urgent dental care when they experienced recent pain; parents, in contrast, identified kids’ oral health issues based on more long-term evidence. The predictive models showed a slightly higher predictive accuracy when combining child-reported and proxy-reported responses.</p>
<p>The short-form items in the short forms for the current study overlapped with most of the items identified in previous work on active caries, 60% for the children survey and 67% for the parent survey [<xref ref-type="bibr" rid="pone.0299947.ref034">34</xref>]. In addition to different sample sizes, the two studies used different optimization principles to select items. The previous study optimized prediction accuracy only, while this study also considered the interaction of survey items and responder’s underlying latent trait simultaneously using IRT, which is better for making predictions on general populations [<xref ref-type="bibr" rid="pone.0299947.ref011">11</xref>].</p>
<p>To investigate the general performance, we repeated algorithms five times for this study. The Repeated 5-fold Nested Cross-Validation helped to reduce the random uncertainty due to model instability and improved model accuracy while not solving overfitting issues completely. Additional external validation on new samples is also needed to ensure the reliability and validity of the developed short forms for the large population.</p>
<p>Because it is critical to identify patients with true active caries or treatment needs correctly for large populations, we traded off the cutoff point of classification thresholds to maintain a sensitivity of at least 85% in the training data sets, resulting in lower specificity rates. This paper only evaluated whether the SMOTE resampling technique can help to improve the performance for this use case. In addition to improving sample data quality, we can also implement other techniques, such as weighted class, under-sampling, data augmentations, and other resampling technique variants, to improve the classification performance for imbalanced class data.</p>
<p>The predictive accuracy can be further enhanced when integrated with other types of data, even with small sample data. A caries risk prediction model using a random forest achieved a test AUC of 0.73 based on oral health questionnaire responses and genetic markers, single nucleotide polymorphisms (SNPs) [<xref ref-type="bibr" rid="pone.0299947.ref060">60</xref>]. With previous caries history and acidogenicity of dental biofilms, the test AUC of the caries risk models was 0.78 [<xref ref-type="bibr" rid="pone.0299947.ref061">61</xref>].</p>
</sec>
<sec id="sec026">
<title>4.3. Implications</title>
<p>The oral health assessment short forms have highly significant value in potentially overcoming longstanding public health challenges in oral health assessment for large populations of children. Such a screening supplement to clinical examinations, although not yet highly accurate, can help to identify the sub-cohort of children who are most vulnerable. Schools and families can more effectively monitor oral health changes. Additional notable strengths include (i) ability to implement through electronic platforms, such as a computer or mobile device, and easy use in large populations; (ii) reduced need for oral health professionals, thereby lowering cost and making surveillance more feasible and sustainable; (iii) ability to be used by a wide range of individuals and in a wide range of settings; (iv) reduced risk of disease transmission from person-to-person contact, thereby allowing for surveillance during COVID-19 or other future pandemics.</p>
<p>In our continued efforts to improve the classification accuracy, especially on low specificities, we will refine the survey based on the current findings on item characteristics and prediction performance. We will target more specific dental diseases of interest with direct oral health questions, such as teeth observations, home relief medications, and treatment history. Furthermore, other types of study design and data collection methods have also been considered for our future work. Due to the dynamic dental disease status, it will be more useful to provide a more precise recall interval. Compared to the cross-sectional study, the longitudinal study is a better option to validate the recall referral recommendation and track the progression of oral health diseases [<xref ref-type="bibr" rid="pone.0299947.ref062">62</xref>, <xref ref-type="bibr" rid="pone.0299947.ref063">63</xref>]. Moreover, linking the survey protocol to other data sources, especially intraoral images [<xref ref-type="bibr" rid="pone.0299947.ref016">16</xref>, <xref ref-type="bibr" rid="pone.0299947.ref054">54</xref>, <xref ref-type="bibr" rid="pone.0299947.ref055">55</xref>], is expected to boost screening accuracy with machine learning and deep learning algorithms.</p>
</sec>
</sec>
<sec id="sec027" sec-type="conclusions">
<title>5. Conclusions</title>
<p>This study developed short forms to identify children who have active caries and/or urgent treatment needs. The proposed framework for short-form development integrates the strength of both IRT and machine learning to enhance clinical decision support. The short forms and this line of research hold the potential to overcome challenges associated with oral health screening for large populations of school-age children.</p>
</sec>
<sec id="sec028" sec-type="supplementary-material">
<title>Supporting information</title>
<supplementary-material id="pone.0299947.s001" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s001" xlink:type="simple">
<label>S1 Data</label>
<caption>
<title>Aggregated data for assumption checking.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0299947.s002" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s002" xlink:type="simple">
<label>S2 Data</label>
<caption>
<title>Item calibration statistics for long forms.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0299947.s003" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s003" xlink:type="simple">
<label>S1 Fig</label>
<caption>
<title>Information curves of long-form and short-form for AC and RFUTN models.</title>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0299947.s004" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s004" xlink:type="simple">
<label>S1 Appendix</label>
<caption>
<title>Technical details of the classification algorithms.</title>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0299947.s005" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s005" xlink:type="simple">
<label>S2 Appendix</label>
<caption>
<title>TRIPOD checklist.</title>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0299947.s006" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0299947.s006" xlink:type="simple">
<label>S3 Appendix</label>
<caption>
<title>List of abbreviations.</title>
<p>(DOCX)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>We would like to acknowledge the following individuals for their assistance in both recruiting patients and providing the space for the field testing: Dr. Suzanne Berger, Dr. Christie Burnett, Dr. Adrienne Fang, Dr. Roger Fieldman, Ms. Dale Gorman, Dr. Karen Ho, Ms. Lucy Juarez, Dr. Oariona Lowe, Mr. Pastor Miranda, Dr. Evangelos Rossopoulos, Dr. Megha Sata, Dr. Justin Shuffer, Ms. Audrey Simons, and Mr. Dennis Young.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0299947.ref001"><label>1</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Benjamin</surname> <given-names>RM</given-names></name>. <article-title>Oral health: the silent epidemic</article-title>. <source>Public Health Reports</source> <year>2010</year>;<volume>125</volume>:<fpage>158</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1177/003335491012500202" xlink:type="simple">10.1177/003335491012500202</ext-link></comment> <object-id pub-id-type="pmid">20297740</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref002"><label>2</label><mixed-citation publication-type="other" xlink:type="simple">Kozol J. Savage inequalities: Children in America’s schools. Crown; 2012.</mixed-citation></ref>
<ref id="pone.0299947.ref003"><label>3</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Jackson</surname> <given-names>SL</given-names></name>, <name name-style="western"><surname>Vann</surname> <given-names>WF</given-names></name>, <name name-style="western"><surname>Kotch</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Pahel</surname> <given-names>BT</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>JY</given-names></name>. <article-title>Impact of poor oral health on children’s school attendance and performance</article-title>. <source>Am J Public Health</source> <year>2011</year>;<volume>101</volume>:<fpage>1900</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2105/AJPH.2010.200915" xlink:type="simple">10.2105/AJPH.2010.200915</ext-link></comment> <object-id pub-id-type="pmid">21330579</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref004"><label>4</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Olszewska</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Rzymski</surname> <given-names>P</given-names></name>. <article-title>Children’s Dental Anxiety during the COVID-19 Pandemic: Polish Experience</article-title>. <source>J Clin Med</source> <year>2020</year>;<volume>9</volume>:<fpage>2751</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/jcm9092751" xlink:type="simple">10.3390/jcm9092751</ext-link></comment> <object-id pub-id-type="pmid">32854401</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref005"><label>5</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Raviv</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Warren</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Washburn</surname> <given-names>JJ</given-names></name>, <name name-style="western"><surname>Kanaley</surname> <given-names>MK</given-names></name>, <name name-style="western"><surname>Eihentale</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Goldenthal</surname> <given-names>HJ</given-names></name>, <etal>et al</etal>. <article-title>Caregiver Perceptions of Children’s Psychological Well-being During the COVID-19 Pandemic</article-title>. <source>JAMA Netw Open</source> <year>2021</year>;<volume>4</volume>:<fpage>e2111103</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jamanetworkopen.2021.11103" xlink:type="simple">10.1001/jamanetworkopen.2021.11103</ext-link></comment> <object-id pub-id-type="pmid">33914046</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref006"><label>6</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Monsantofils</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Bernabé</surname> <given-names>E</given-names></name>. <article-title>Oral impacts on daily performances and recent use of dental services in schoolchildren</article-title>. <source>Int J Paediatr Dent</source> <year>2014</year>;<volume>24</volume>:<fpage>417</fpage>–<lpage>23</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ipd.12087" xlink:type="simple">10.1111/ipd.12087</ext-link></comment> <object-id pub-id-type="pmid">25430514</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref007"><label>7</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pahel</surname> <given-names>BT</given-names></name>, <name name-style="western"><surname>Rozier</surname> <given-names>RG</given-names></name>, <name name-style="western"><surname>Slade</surname> <given-names>GD</given-names></name>. <article-title>Parental perceptions of children’s oral health: The Early Childhood Oral Health Impact Scale (ECOHIS)</article-title>. <source>Health Qual Life Outcomes</source> <year>2007</year>;<volume>5</volume>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1477-7525-5-6" xlink:type="simple">10.1186/1477-7525-5-6</ext-link></comment> <object-id pub-id-type="pmid">17263880</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref008"><label>8</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Jokovic</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Locker</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Guyatt</surname> <given-names>G</given-names></name>. <article-title>Short forms of the Child Perceptions Questionnaire for 11–14-year-old children (CPQ11–14): Development and initial evaluation</article-title>. <source>Health Qual Life Outcomes</source> <year>2006</year>;<volume>4</volume>:<fpage>4</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1477-7525-4-4" xlink:type="simple">10.1186/1477-7525-4-4</ext-link></comment> <object-id pub-id-type="pmid">16423298</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref009"><label>9</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Genderson</surname> <given-names>MW</given-names></name>, <name name-style="western"><surname>Sischo</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Markowitz</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Fine</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Broder</surname> <given-names>HL</given-names></name>. <article-title>An Overview of Children’s Oral Health-Related Quality of Life Assessment: From Scale Development to Measuring Outcomes</article-title>. <source>Caries Res</source> <year>2013</year>;<volume>47</volume>:<fpage>13</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1159/000351693" xlink:type="simple">10.1159/000351693</ext-link></comment> <object-id pub-id-type="pmid">24107604</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref010"><label>10</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kline</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Kline</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Hossein Abad</surname> <given-names>ZS</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>J</given-names></name>. <article-title>Using item response theory for explainable machine learning in predicting mortality in the intensive care unit: Case-based approach</article-title>. <source>J Med Internet Res</source> <year>2020</year>;<volume>22</volume>:<fpage>e20268</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2196/20268" xlink:type="simple">10.2196/20268</ext-link></comment> <object-id pub-id-type="pmid">32975523</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref011"><label>11</label><mixed-citation publication-type="other" xlink:type="simple">Kline A, Kline T, Hossein Abad ZS, Lee J. Novel Feature Selection for Artificial Intelligence Using Item Response Theory for Mortality Prediction. Proceedings of the Annual International Conference of the IEEE Engineering in Medicine and Biology Society, EMBS, vol. 2020-July, Institute of Electrical and Electronics Engineers Inc.; 2020, p. 5729–32.</mixed-citation></ref>
<ref id="pone.0299947.ref012"><label>12</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cooper</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Petrides</surname> <given-names>KV</given-names></name>. <article-title>A psychometric analysis of the Trait Emotional Intelligence Questionnaire-Short Form (TEIQue-SF) using item response theory</article-title>. <source>J Pers Assess</source> <year>2010</year>;<volume>92</volume>:<fpage>449</fpage>–<lpage>57</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/00223891.2010.497426" xlink:type="simple">10.1080/00223891.2010.497426</ext-link></comment> <object-id pub-id-type="pmid">20706931</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref013"><label>13</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Costa</surname> <given-names>DSJ</given-names></name>, <name name-style="western"><surname>Asghari</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Nicholas</surname> <given-names>MK</given-names></name>. <article-title>Item response theory analysis of the Pain Self-Efficacy Questionnaire</article-title>. <source>Scand J Pain</source> <year>2017</year>;<volume>14</volume>:<fpage>113</fpage>–<lpage>7</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.sjpain.2016.08.001" xlink:type="simple">10.1016/j.sjpain.2016.08.001</ext-link></comment> <object-id pub-id-type="pmid">28850425</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref014"><label>14</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Glas</surname> <given-names>CAW</given-names></name>. <article-title>Item response theory in educational assessment and evaluation</article-title>. <source>Mes Eval Educ</source> <year>2014</year>;<volume>31</volume>:<fpage>19</fpage>–<lpage>34</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7202/1025005AR" xlink:type="simple">10.7202/1025005AR</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref015"><label>15</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zanon</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Hutz</surname> <given-names>CS</given-names></name>, <name name-style="western"><surname>Yoo</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Hambleton</surname> <given-names>RK</given-names></name>. <article-title>An application of item response theory to psychological test development</article-title>. <source>Psicologia: Reflexao e Critica</source> <year>2016</year>;<volume>29</volume>:<fpage>1</fpage>–<lpage>10</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s41155-016-0040-x" xlink:type="simple">10.1186/s41155-016-0040-x</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref016"><label>16</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nguyen</surname> <given-names>TH</given-names></name>, <name name-style="western"><surname>Han</surname> <given-names>HR</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>MT</given-names></name>, <name name-style="western"><surname>Chan</surname> <given-names>KS</given-names></name>. <article-title>An introduction to item response theory for patient-reported outcome measurement</article-title>. <source>Patient</source> <year>2014</year>;<volume>7</volume>:<fpage>23</fpage>–<lpage>35</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s40271-013-0041-0" xlink:type="simple">10.1007/s40271-013-0041-0</ext-link></comment> <object-id pub-id-type="pmid">24403095</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref017"><label>17</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Stover</surname> <given-names>AM</given-names></name>, <name name-style="western"><surname>McLeod</surname> <given-names>LD</given-names></name>, <name name-style="western"><surname>Langer</surname> <given-names>MM</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>WH</given-names></name>, <name name-style="western"><surname>Reeve</surname> <given-names>BB</given-names></name>. <article-title>State of the psychometric methods: patient-reported outcome measure development and refinement using item response theory</article-title>. <source>J Patient Rep Outcomes</source> <year>2019</year>;<volume>3</volume>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s41687-019-0130-5" xlink:type="simple">10.1186/s41687-019-0130-5</ext-link></comment> <object-id pub-id-type="pmid">31359210</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref018"><label>18</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shaw</surname> <given-names>AM</given-names></name>, <name name-style="western"><surname>Rogge</surname> <given-names>RD</given-names></name>. <article-title>Evaluating and Refining the Construct of Sexual Quality With Item Response Theory: Development of the Quality of Sex Inventory</article-title>. <source>Arch Sex Behav</source> <year>2016</year>;<volume>45</volume>:<fpage>249</fpage>–<lpage>70</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s10508-015-0650-x" xlink:type="simple">10.1007/s10508-015-0650-x</ext-link></comment> <object-id pub-id-type="pmid">26728053</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref019"><label>19</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Edelen</surname> <given-names>MO</given-names></name>, <name name-style="western"><surname>Reeve</surname> <given-names>BB</given-names></name>. <article-title>Applying item response theory (IRT) modeling to questionnaire development, evaluation, and refinement</article-title>. <source>Quality of Life Research</source> <year>2007</year>;<volume>16</volume>:<fpage>5</fpage>–<lpage>18</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11136-007-9198-0" xlink:type="simple">10.1007/s11136-007-9198-0</ext-link></comment> <object-id pub-id-type="pmid">17375372</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref020"><label>20</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hung</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Voss</surname> <given-names>MW</given-names></name>, <name name-style="western"><surname>Rosales</surname> <given-names>MN</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Su</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Xu</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>Application of machine learning for diagnostic prediction of root caries</article-title>. <source>Gerodontology</source> <year>2019</year>;<volume>36</volume>:<fpage>395</fpage>–<lpage>404</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ger.12432" xlink:type="simple">10.1111/ger.12432</ext-link></comment> <object-id pub-id-type="pmid">31274221</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref021"><label>21</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Adeoye</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Tan</surname> <given-names>JY</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>SW</given-names></name>, <name name-style="western"><surname>Thomson</surname> <given-names>P</given-names></name>. <article-title>Prediction models applying machine learning to oral cavity cancer outcomes: A systematic review</article-title>. <source>Int J Med Inform</source> <year>2021</year>;<volume>154</volume>:<fpage>104557</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ijmedinf.2021.104557" xlink:type="simple">10.1016/j.ijmedinf.2021.104557</ext-link></comment> <object-id pub-id-type="pmid">34455119</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref022"><label>22</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>You</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Hao</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Xia</surname> <given-names>B</given-names></name>. <article-title>Deep learning-based dental plaque detection on primary teeth: A comparison with clinical assessments</article-title>. <source>BMC Oral Health</source> <year>2020</year>;<volume>20</volume>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12903-020-01114-6" xlink:type="simple">10.1186/s12903-020-01114-6</ext-link></comment> <object-id pub-id-type="pmid">32404094</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref023"><label>23</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Carrillo-Perez</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Pecho</surname> <given-names>OE</given-names></name>, <name name-style="western"><surname>Morales</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Paravina</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Della Bona</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Ghinea</surname> <given-names>R</given-names></name>, <etal>et al</etal>. <article-title>Applications of artificial intelligence in dentistry: A comprehensive review</article-title>. <source>Journal of Esthetic and Restorative Dentistry</source> <year>2022</year>;<volume>34</volume>:<fpage>259</fpage>–<lpage>80</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/jerd.12844" xlink:type="simple">10.1111/jerd.12844</ext-link></comment> <object-id pub-id-type="pmid">34842324</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref024"><label>24</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Prokhorenkova</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Gusev</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Vorobev</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Dorogush</surname> <given-names>AV</given-names></name>, <name name-style="western"><surname>Gulin</surname> <given-names>A</given-names></name>. <article-title>CatBoost: unbiased boosting with categorical features</article-title>. <source>Adv Neural Inf Process Syst</source> <year>2017</year>;<volume>2018-December</volume>:<fpage>6638</fpage>–<lpage>48</lpage>.</mixed-citation></ref>
<ref id="pone.0299947.ref025"><label>25</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Biau</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Scornet</surname> <given-names>E</given-names></name>. <article-title>A random forest guided tour</article-title>. <source>Test</source> <year>2016</year>;<volume>25</volume>:<fpage>197</fpage>–<lpage>227</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11749-016-0481-7" xlink:type="simple">10.1007/s11749-016-0481-7</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref026"><label>26</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Suthaharan</surname> <given-names>S.</given-names></name> <source>Support Vector Machine</source>, <publisher-name>Springer</publisher-name>, <publisher-loc>Boston, MA</publisher-loc>; <year>2016</year>, p. <fpage>207</fpage>–<lpage>35</lpage>.</mixed-citation></ref>
<ref id="pone.0299947.ref027"><label>27</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Dreiseitl</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Ohno-Machado</surname> <given-names>L</given-names></name>. <article-title>Logistic regression and artificial neural network classification models: A methodology review</article-title>. <source>J Biomed Inform</source> <year>2002</year>;<volume>35</volume>:<fpage>352</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/s1532-0464%2803%2900034-0" xlink:type="simple">10.1016/s1532-0464(03)00034-0</ext-link></comment> <object-id pub-id-type="pmid">12968784</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref028"><label>28</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Maida</surname> <given-names>CA</given-names></name>, <name name-style="western"><surname>Shen</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Xiong</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>Developing Children’s Oral Health Assessment Toolkits Using Machine Learning Algorithm</article-title>. <source>JDR Clin Trans Res</source> <year>2020</year>;<volume>5</volume>:<fpage>233</fpage>–<lpage>43</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1177/2380084419885612" xlink:type="simple">10.1177/2380084419885612</ext-link></comment> <object-id pub-id-type="pmid">31710817</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref029"><label>29</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yoon</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Odlum</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Mitchell</surname> <given-names>DA</given-names></name>, <name name-style="western"><surname>Kronish</surname> <given-names>IM</given-names></name>, <name name-style="western"><surname>Davidson</surname> <given-names>KW</given-names></name>, <etal>et al</etal>. <article-title>Machine Learning to Identify Behavioral Determinants of Oral Health in Inner City Older Hispanic Adults</article-title>. <source>Stud Health Technol Inform</source> <year>2018</year>;<volume>251</volume>:<fpage>253</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3233/978-1-61499-880-8-253" xlink:type="simple">10.3233/978-1-61499-880-8-253</ext-link></comment> <object-id pub-id-type="pmid">29968651</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref030"><label>30</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Chu</surname> <given-names>CS</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>NP</given-names></name>, <name name-style="western"><surname>Adeoye</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Thomson</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>SW</given-names></name>. <article-title>Machine learning and treatment outcome prediction for oral cancer</article-title>. <source>Journal of Oral Pathology and Medicine</source> <year>2020</year>;<volume>49</volume>:<fpage>977</fpage>–<lpage>85</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/jop.13089" xlink:type="simple">10.1111/jop.13089</ext-link></comment> <object-id pub-id-type="pmid">32740951</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref031"><label>31</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hung</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Hon</surname> <given-names>ES</given-names></name>, <name name-style="western"><surname>Ruiz-Negron</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Lauren</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Moffat</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Su</surname> <given-names>W</given-names></name>, <etal>et al</etal>. <article-title>Exploring the Intersection between Social Determinants of Health and Unmet Dental Care Needs Using Deep Learning</article-title>. <source>Int J Environ Res Public Health</source> <year>2020</year>;<volume>17</volume>:<fpage>7286</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/ijerph17197286" xlink:type="simple">10.3390/ijerph17197286</ext-link></comment> <object-id pub-id-type="pmid">33036152</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref032"><label>32</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Liu</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Maida</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Shen</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>Short form development for oral health patient-reported outcome evaluation in children and adolescents</article-title>. <source>Quality of Life Research</source> <year>2018</year>;<volume>27</volume>:<fpage>1599</fpage>–<lpage>611</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11136-018-1820-9" xlink:type="simple">10.1007/s11136-018-1820-9</ext-link></comment> <object-id pub-id-type="pmid">29508207</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref033"><label>33</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Maida</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Shen</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Xiong</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>Development of a parents’ short form survey of their children’s oral health</article-title>. <source>Int J Paediatr Dent</source> <year>2019</year>;<volume>29</volume>:<fpage>332</fpage>–<lpage>44</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ipd.12453" xlink:type="simple">10.1111/ipd.12453</ext-link></comment> <object-id pub-id-type="pmid">30481390</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref034"><label>34</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Xiong</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Maida</surname> <given-names>CA</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Coulter</surname> <given-names>ID</given-names></name>, <etal>et al</etal>. <article-title>Development of toolkits for detecting dental caries and caries experience among children using self-report and parent report</article-title>. <source>Community Dent Oral Epidemiol</source> <year>2019</year>;<volume>47</volume>:<fpage>520</fpage>–<lpage>7</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/cdoe.12494" xlink:type="simple">10.1111/cdoe.12494</ext-link></comment> <object-id pub-id-type="pmid">31576591</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref035"><label>35</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Liu</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Coulter</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Maida</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Ramos-Gomez</surname> <given-names>F</given-names></name>, <etal>et al</etal>. <article-title>Patient-Reported oral health outcome measurement for children and adolescents</article-title>. <source>BMC Oral Health</source> <year>2016</year>;<volume>16</volume>:<fpage>1</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12903-016-0293-x" xlink:type="simple">10.1186/s12903-016-0293-x</ext-link></comment> <object-id pub-id-type="pmid">27634621</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref036"><label>36</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Byrt</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Bishop</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Carlin</surname> <given-names>JB</given-names></name>. <article-title>Bias, prevalence and kappa</article-title>. <source>J Clin Epidemiol</source> <year>1993</year>;<volume>46</volume>:<fpage>423</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/0895-4356%2893%2990018-v" xlink:type="simple">10.1016/0895-4356(93)90018-v</ext-link></comment> <object-id pub-id-type="pmid">8501467</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref037"><label>37</label><mixed-citation publication-type="other" xlink:type="simple">Gwet K. Inter-rater reliability: dependency on trait prevalence and marginal homogeneity. Statistical Methods for Inter-Rater Reliability Assessment. Citeseer; 2002.</mixed-citation></ref>
<ref id="pone.0299947.ref038"><label>38</label><mixed-citation publication-type="other" xlink:type="simple">National Center for Health Statistics (NCHS). National health and nutrition examination survey (NHANES), oral health examiners manual 2013. <ext-link ext-link-type="uri" xlink:href="https://wwwn.cdc.gov/nchs/data/nhanes/2013-2014/manuals/Oral_Health_Examiners.pdf" xlink:type="simple">https://wwwn.cdc.gov/nchs/data/nhanes/2013-2014/manuals/Oral_Health_Examiners.pdf</ext-link> (accessed January 25, 2021).</mixed-citation></ref>
<ref id="pone.0299947.ref039"><label>39</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Maida</surname> <given-names>CA</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Coulter</surname> <given-names>ID</given-names></name>, <name name-style="western"><surname>Ramos-Gomez</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>SY</given-names></name>, <etal>et al</etal>. <article-title>Qualitative methods in the development of a parent survey of children’s oral health status</article-title>. <source>J Patient Rep Outcomes</source> <year>2018</year>;<volume>2</volume>:<fpage>1</fpage>–<lpage>18</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s41687-018-0033-x" xlink:type="simple">10.1186/s41687-018-0033-x</ext-link></comment> <object-id pub-id-type="pmid">29757326</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref040"><label>40</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rose</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Bjorner</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Gandek</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Bruce</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Fries</surname> <given-names>JF</given-names></name>, <name name-style="western"><surname>Ware</surname> <given-names>JE</given-names></name>. <article-title>The PROMIS Physical Function item bank was calibrated to a standardized metric and shown to improve measurement efficiency</article-title>. <source>J Clin Epidemiol</source> <year>2014</year>;<volume>67</volume>:<fpage>516</fpage>–<lpage>26</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jclinepi.2013.10.024" xlink:type="simple">10.1016/j.jclinepi.2013.10.024</ext-link></comment> <object-id pub-id-type="pmid">24698295</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref041"><label>41</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Samejima</surname> <given-names>F.</given-names></name> <chapter-title>Graded Response Model</chapter-title>. <source>Handbook of Modern Item Response Theory</source>, <publisher-name>Springer</publisher-name> <publisher-loc>New York</publisher-loc>; <year>1997</year>, p. <fpage>85</fpage>–<lpage>100</lpage>.</mixed-citation></ref>
<ref id="pone.0299947.ref042"><label>42</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Reeve</surname> <given-names>BB</given-names></name>, <name name-style="western"><surname>Hays</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>Bjorner</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Cook</surname> <given-names>KF</given-names></name>, <name name-style="western"><surname>Crane</surname> <given-names>PK</given-names></name>, <name name-style="western"><surname>Teresi</surname> <given-names>JA</given-names></name>, <etal>et al</etal>. <article-title>Psychometric Evaluation and Calibration of Health-Related Quality of Life Item Banks</article-title>. <source>Med Care</source> <year>2007</year>;<volume>45</volume>:<fpage>S22</fpage>–<lpage>31</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1097/01.mlr.0000250483.85507.04" xlink:type="simple">10.1097/01.mlr.0000250483.85507.04</ext-link></comment> <object-id pub-id-type="pmid">17443115</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref043"><label>43</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Awang</surname> <given-names>Z.</given-names></name> <source>SEM Made Simple: A Gentle Approach to Learning Structural Equation Modeling</source>. <publisher-name>MPWS Rich Publication</publisher-name>; <year>2015</year>.</mixed-citation></ref>
<ref id="pone.0299947.ref044"><label>44</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bentler</surname> <given-names>PM</given-names></name>. <article-title>Comparative fit indexes in structural models</article-title>. <source>Psychol Bull</source> <year>1990</year>;<volume>107</volume>:<fpage>238</fpage>–<lpage>46</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1037/0033-2909.107.2.238" xlink:type="simple">10.1037/0033-2909.107.2.238</ext-link></comment> <object-id pub-id-type="pmid">2320703</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref045"><label>45</label><mixed-citation publication-type="other" xlink:type="simple">Rosseel Y. lavaan: An R package for structural equation modeling and more. Version 0.5–12 (BETA). 2012.</mixed-citation></ref>
<ref id="pone.0299947.ref046"><label>46</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bandalos</surname> <given-names>DL</given-names></name>. <article-title>Relative Performance of Categorical Diagonally Weighted Least Squares and Robust Maximum Likelihood Estimation</article-title>. <source>Structural Equation Modeling</source> <year>2014</year>;<volume>21</volume>:<fpage>102</fpage>–<lpage>16</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/10705511.2014.859510" xlink:type="simple">10.1080/10705511.2014.859510</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref047"><label>47</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Forero</surname> <given-names>CG</given-names></name>, <name name-style="western"><surname>Maydeu-Olivares</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Gallardo-Pujol</surname> <given-names>D</given-names></name>. <article-title>Factor Analysis with Ordinal Indicators: A Monte Carlo Study Comparing DWLS and ULS Estimation</article-title>. <source>Struct Equ Modeling</source> <year>2009</year>;<volume>16</volume>:<fpage>625</fpage>–<lpage>41</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/10705510903203573" xlink:type="simple">10.1080/10705510903203573</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref048"><label>48</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Muthén</surname> <given-names>LK</given-names></name>, <name name-style="western"><surname>Muthén</surname> <given-names>BO</given-names></name>. <source>Statistical Analysis With Latent Variables User’s Guide</source>. <year>1998</year>.</mixed-citation></ref>
<ref id="pone.0299947.ref049"><label>49</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kim</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Oshima</surname> <given-names>TC</given-names></name>. <article-title>Effect of Multiple Testing Adjustment in Differential Item Functioning Detection</article-title>. <source>Educ Psychol Meas</source> <year>2012</year>;<volume>73</volume>:<fpage>458</fpage>–<lpage>70</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1177/0013164412467033" xlink:type="simple">10.1177/0013164412467033</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref050"><label>50</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Benjamini</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Hochberg</surname> <given-names>Y</given-names></name>. <article-title>Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing</article-title>. <source>Journal of the Royal Statistical Society: Series B (Methodological)</source> <year>1995</year>;<volume>57</volume>:<fpage>289</fpage>–<lpage>300</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/J.2517-6161.1995.TB02031.X" xlink:type="simple">10.1111/J.2517-6161.1995.TB02031.X</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref051"><label>51</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Collins</surname> <given-names>GS</given-names></name>, <name name-style="western"><surname>Reitsma</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Altman</surname> <given-names>DG</given-names></name>, <name name-style="western"><surname>Moons</surname> <given-names>KGM</given-names></name>. <article-title>Transparent Reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis (TRIPOD): The TRIPOD Statement</article-title>. <source>British Journal of Surgery</source> <year>2015</year>;<volume>102</volume>:<fpage>148</fpage>–<lpage>58</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/bjs.9736" xlink:type="simple">10.1002/bjs.9736</ext-link></comment> <object-id pub-id-type="pmid">25627261</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref052"><label>52</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Vabalas</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Gowen</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Poliakoff</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Casson</surname> <given-names>AJ</given-names></name>. <article-title>Machine learning algorithm validation with a limited sample size</article-title>. <source>PLoS One</source> <year>2019</year>;<volume>14</volume>:<fpage>e0224365</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0224365" xlink:type="simple">10.1371/journal.pone.0224365</ext-link></comment> <object-id pub-id-type="pmid">31697686</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref053"><label>53</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Varma</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Simon</surname> <given-names>R</given-names></name>. <article-title>Bias in error estimation when using cross-validation for model selection</article-title>. <source>BMC Bioinformatics</source> <year>2006</year>;<volume>7</volume>:<fpage>91</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-7-91" xlink:type="simple">10.1186/1471-2105-7-91</ext-link></comment> <object-id pub-id-type="pmid">16504092</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref054"><label>54</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Chawla</surname> <given-names>NV</given-names></name>, <name name-style="western"><surname>Bowyer</surname> <given-names>KW</given-names></name>, <name name-style="western"><surname>Hall</surname> <given-names>LO</given-names></name>, <name name-style="western"><surname>Kegelmeyer</surname> <given-names>WP</given-names></name>. <article-title>SMOTE: Synthetic minority over-sampling technique</article-title>. <source>Journal of Artificial Intelligence Research</source> <year>2002</year>;<volume>16</volume>:<fpage>321</fpage>–<lpage>57</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1613/jair.953" xlink:type="simple">10.1613/jair.953</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref055"><label>55</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ma</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Fan</surname> <given-names>S</given-names></name>. <article-title>CURE-SMOTE algorithm and hybrid algorithm for feature selection and parameter optimization based on random forests</article-title>. <source>BMC Bioinformatics</source> <year>2017</year>;<volume>18</volume>:<fpage>169</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12859-017-1578-z" xlink:type="simple">10.1186/s12859-017-1578-z</ext-link></comment> <object-id pub-id-type="pmid">28292263</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref056"><label>56</label><mixed-citation publication-type="other" xlink:type="simple">Venables WN, Smith DM, the R Development Core Team. An Introduction to R. 2003.</mixed-citation></ref>
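<ref id="pone.0299947.ref057"><label>57</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kuhn</surname> <given-names>M.</given-names></name> <article-title>Building Predictive Models in R Using the caret Package</article-title>. <source>J Stat Softw</source> <year>2008</year>;<volume>28</volume>:<fpage>1</fpage>–<lpage>26</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.18637/jss.v028.i05" xlink:type="simple">10.18637/jss.v028.i05</ext-link></comment></mixed-citation></ref>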
<ref id="pone.0299947.ref058"><label>58</label><mixed-citation publication-type="other" xlink:type="simple">Torgo L. Package “DMwR”: Functions and data for “Data Mining with R”. 2013.</mixed-citation></ref>
<ref id="pone.0299947.ref059"><label>59</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rajput</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>WJ</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>CC</given-names></name>. <article-title>Evaluation of a decided sample size in machine learning applications</article-title>. <source>BMC Bioinformatics</source> <year>2023</year>;<volume>24</volume>:<fpage>1</fpage>–<lpage>17</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12859-023-05156-9" xlink:type="simple">10.1186/s12859-023-05156-9</ext-link></comment></mixed-citation></ref>
<ref id="pone.0299947.ref060"><label>60</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pang</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Tao</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Zhi</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Lin</surname> <given-names>H</given-names></name>. <article-title>A New Model for Caries Risk Prediction in Teenagers Using a Machine Learning Algorithm Based on Environmental and Genetic Factors</article-title>. <source>Front Genet</source> <year>2021</year>;<volume>12</volume>:<fpage>636867</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2021.636867" xlink:type="simple">10.3389/fgene.2021.636867</ext-link></comment> <object-id pub-id-type="pmid">33777105</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref061"><label>61</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kim</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>JS</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>YH</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>HE</given-names></name>. <article-title>Simplified Prediction Model for Accurate Assessment of Dental Caries Risk among Participants Aged 10–18 Years</article-title>. <source>Tohoku J Exp Med</source> <year>2018</year>;<volume>246</volume>:<fpage>81</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1620/tjem.246.81" xlink:type="simple">10.1620/tjem.246.81</ext-link></comment> <object-id pub-id-type="pmid">30333362</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref062"><label>62</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Abanto</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Celiberti</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Braga</surname> <given-names>MM</given-names></name>, <name name-style="western"><surname>Vidigal</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Cordeschi</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Haddad</surname> <given-names>AE</given-names></name>, <etal>et al</etal>. <article-title>Effectiveness of a preventive program based on caries risk assessment and recall intervals on the incidence and regression of initial caries lesions in children</article-title>. <source>Int J Paediatr Dent</source> <year>2015</year>;<volume>25</volume>:<fpage>291</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ipd.12144" xlink:type="simple">10.1111/ipd.12144</ext-link></comment> <object-id pub-id-type="pmid">25413129</object-id></mixed-citation></ref>
<ref id="pone.0299947.ref063"><label>63</label><mixed-citation publication-type="other" xlink:type="simple">Abanto J, Berti GO, Miguita L, Bonecker M. Monitoring of caries disease by risk assessments and activity. RGO, Rev Gaúch Odontol 2016.</mixed-citation></ref>
</ref-list>
</back>
</article>