<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PONE-D-21-11415</article-id>
<article-id pub-id-type="doi">10.1371/journal.pone.0258214</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Positron emission tomography</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Positron emission tomography</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Diagnostic medicine</subject><subj-group><subject>Diagnostic radiology</subject><subj-group><subject>Tomography</subject><subj-group><subject>Positron emission tomography</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Diagnostic radiology</subject><subj-group><subject>Tomography</subject><subj-group><subject>Positron emission tomography</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Radiology and imaging</subject><subj-group><subject>Diagnostic radiology</subject><subj-group><subject>Tomography</subject><subj-group><subject>Positron emission tomography</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Mental health and psychiatry</subject><subj-group><subject>Dementia</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Neurology</subject><subj-group><subject>Dementia</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Medical conditions</subject><subj-group><subject>Neurodegenerative diseases</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Neurology</subject><subj-group><subject>Neurodegenerative diseases</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Software engineering</subject><subj-group><subject>Preprocessing</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Engineering and technology</subject><subj-group><subject>Software engineering</subject><subj-group><subject>Preprocessing</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Data management</subject><subj-group><subject>Data visualization</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Social sciences</subject><subj-group><subject>Sociology</subject><subj-group><subject>Education</subject><subj-group><subject>Training (education)</subject><subj-group><subject>Retraining</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Data acquisition</subject></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject></subj-group></article-categories>
<title-group>
<article-title>Performance evaluation in [<sup>18</sup>F]Florbetaben brain PET images classification using 3D Convolutional Neural Network</article-title>
<alt-title alt-title-type="running-head">Performance evaluation in brain PET images classification using 3D CNN</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-1779-1801</contrib-id>
<name name-style="western">
<surname>Lee</surname> <given-names>Seung-Yeon</given-names></name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="http://credit.niso.org/contributor-roles/software/">Software</role>
<role content-type="http://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="http://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Kang</surname> <given-names>Hyeon</given-names></name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="http://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="http://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-8954-3559</contrib-id>
<name name-style="western">
<surname>Jeong</surname> <given-names>Jong-Hun</given-names></name>
<role content-type="http://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="http://credit.niso.org/contributor-roles/software/">Software</role>
<role content-type="http://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-1688-0818</contrib-id>
<name name-style="western">
<surname>Kang</surname> <given-names>Do-young</given-names></name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="http://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="http://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="http://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="http://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Department of Translational Biomedical Sciences, Dong-A University, Busan, Korea</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Institute of Convergence Bio-Health, Dong-A University, Busan, Korea</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>DEEPNOID Inc., Seoul, Korea</addr-line>
</aff>
<aff id="aff004">
<label>4</label>
<addr-line>Department of Nuclear Medicine, Dong-A University Medical Center, Busan, Korea</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Alongi</surname> <given-names>Pierpaolo</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>Fondazione Istituto G.Giglio di Cefalu, ITALY</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">dykang@dau.ac.kr</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<pub-date pub-type="epub">
<day>20</day>
<month>10</month>
<year>2021</year>
</pub-date>
<volume>16</volume>
<issue>10</issue>
<elocation-id>e0258214</elocation-id>
<history>
<date date-type="received">
<day>8</day>
<month>4</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>9</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-year>2021</copyright-year>
<copyright-holder>Lee et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0258214"/>
<abstract>
<p>High accuracy has been reported in deep learning classification for amyloid brain scans, an important factor in Alzheimer’s disease diagnosis. However, the possibility of overfitting should be considered, as this model is fitted with sample data. Therefore, we created and evaluated an [<sup>18</sup>F]Florbetaben amyloid brain positron emission tomography (PET) scan classification model with a Dong-A University Hospital (DAUH) dataset based on a convolutional neural network (CNN), and performed external validation with the Alzheimer’s Disease Neuroimaging Initiative dataset. Spatial normalization, count normalization, and skull stripping preprocessing were performed on the DAUH and external datasets. However, smoothing was only performed on the external dataset. Three types of models were used, depending on their structure: Inception3D, ResNet3D, and VGG3D. After training with 80% of the DAUH dataset, an appropriate model was selected, and the rest of the DAUH dataset was used for model evaluation. The generalization potential of the selected model was then validated using the external dataset. The accuracy of the model evaluation for Inception3D, ResNet3D, and VGG3D was 95.4%, 92.0%, and 97.7%, and the accuracy of the external validation was 76.7%, 67.1%, and 85.3%, respectively. Inception3D and ResNet3D were retrained with the external dataset; then, the area under the curve was compared to determine the binary classification performance with a significance level of less than 0.05. When external validation was performed again after fine tuning, the performance improved to 15.3%p for Inception3D and 16.9%p for ResNet3D. In [<sup>18</sup>F]Florbetaben amyloid brain PET scan classification using CNN, the generalization potential can be seen through external validation. When there is a significant difference between the model classification performance and the external validation, changing the model structure or fine tuning the model can help improve the classification performance, and the optimal model can also be found by collaborating through a web-based open platform.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution>National Research Foundation of Korea (KR)</institution>
</funding-source>
<award-id>NRF-2018 R1A2B2008178</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-1688-0818</contrib-id>
<name name-style="western">
<surname>Kang</surname> <given-names>Do-young</given-names>
</name>
</principal-award-recipient>
</award-group>
<funding-statement>This work was supported by the Dong-A University research fund. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="11"/>
<table-count count="6"/>
<page-count count="16"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All relevant data are available on Figshare: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.6084/m9.figshare.16702519.v1" xlink:type="simple">https://doi.org/10.6084/m9.figshare.16702519.v1</ext-link>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>1 Introduction</title>
<p>Alzheimer’s disease (AD) is a progressive and irreversible neurodegenerative disease in which a patient gradually loses memory, mental function, and the ability to continue daily activities [<xref ref-type="bibr" rid="pone.0258214.ref001">1</xref>]. As there is no effective treatment for AD, an accurate diagnosis is essential for developing the patient’s future treatment plan. Neuroimaging technology using AD-related biomarkers is widely used to increase the reliability of AD diagnosis [<xref ref-type="bibr" rid="pone.0258214.ref002">2</xref>]. Radiotracers are among the types of biomarkers that can be injected into the subject’s body and observed via PET. Representative radiotracers used to diagnose AD include 2-[<sup>18</sup>F]fluoro-D-glucose, which can identify the degree of brain metabolism, and [<sup>18</sup>F]Florbetaben, [<sup>18</sup>F]Florbetapir and [<sup>18</sup>F]Flutemetamol which can observe brain amyloid plaque load.</p>
<p>According to specific or diagnostic criteria [<xref ref-type="bibr" rid="pone.0258214.ref003">3</xref>–<xref ref-type="bibr" rid="pone.0258214.ref005">5</xref>], several systems apply brain PET scans to machine learning and deep learning models to train, evaluate, and classify images. Moreover, there is also recent work using them on automatic and semi-automatic segmentation algorithms in PET [<xref ref-type="bibr" rid="pone.0258214.ref006">6</xref>, <xref ref-type="bibr" rid="pone.0258214.ref007">7</xref>]. In one study, an AD diagnosis classifier using PCA and SVM was utilized after image dimension reduction of [<sup>18</sup>F]Florbetaben brain PET images [<xref ref-type="bibr" rid="pone.0258214.ref008">8</xref>], and in another, images were classified according to amyloid deposition with an accuracy of 89% [<xref ref-type="bibr" rid="pone.0258214.ref009">9</xref>] using Visual Geometry Group (VGG) 16 [<xref ref-type="bibr" rid="pone.0258214.ref010">10</xref>], which is a well-known structure among convolutional neural networks (CNN) [<xref ref-type="bibr" rid="pone.0258214.ref011">11</xref>, <xref ref-type="bibr" rid="pone.0258214.ref012">12</xref>] that specializes in image feature extraction using deep learning technology.</p>
<p>Meanwhile, because of the nature of medical images, acquisition costs can be high; thus, it is not easy to construct a large dataset. When a model is trained and tested with a limited number of datasets, to confirm the generalization possibility, it is necessary to configure an external dataset that is different from the source of the training dataset and to validate its potential.</p>
<p>Previous studies, such as the external validation of pancreatic cancer from CT images [<xref ref-type="bibr" rid="pone.0258214.ref013">13</xref>] and the external validation of malignancy risk prediction of lung nodules [<xref ref-type="bibr" rid="pone.0258214.ref014">14</xref>], have been reported. It is necessary to apply the validation process to brain imaging to build a model and then to externally validate the model with the same type of brain images obtained from other sites.</p>
<p>In this study, brain PET scans of [<sup>18</sup>F]Florbetaben, a diagnostic radiotracer that visualizes the classification of <italic>β</italic>-amyloid (A<italic>β</italic>), the main component of amyloid plaques found in the brain, were acquired from Dong-A University Hospital (DAUH) and used to construct a dataset. We created models that receive 3D voxel input by deriving characteristic structures from the well-known CNN structures Inception, VGG, and ResNet. We then selected one representative model for each structure after training according to the model selection criteria. With this model, the images acquired from the Alzheimer’s Disease Neuroimaging Initiative (ADNI) were used as a dataset and externally validated to examine the possibility of generalization.</p>
</sec>
<sec id="sec002" sec-type="materials|methods">
<title>2 Materials and methods</title>
<sec id="sec003">
<title>2.1 Data acquisition</title>
<p>The DAUH dataset, listed in <xref ref-type="table" rid="pone.0258214.t001">Table 1</xref>, comprises a total of 432 subjects according to the visually assessed criteria of [<sup>18</sup>F]Florbetaben PET. An available database was collected from 2015 to 2020 from the Department of Nuclear Medicine at DAUH for a possible population of [<sup>18</sup>F]Florbetaben PET. Labeling for A<italic>β</italic> negative and positive was performed according to the decision of a nuclear medicine specialist at DAUH.</p>
<table-wrap id="pone.0258214.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t001</object-id>
<label>Table 1</label>
<caption>
<title>Demographics and positivity of study participants according to each dataset group.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center">Dataset</th>
<th align="center" colspan="2">DAUH</th>
<th align="center" colspan="2">External</th>
</tr>
<tr>
<th align="center">n</th>
<th align="center" colspan="2">432</th>
<th align="center" colspan="2">251</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">Visual Assessment</td>
<td align="center">Negative</td>
<td align="center">Positive</td>
<td align="center">Negative</td>
<td align="center">Positive</td>
</tr>
<tr>
<td align="center">Subjects</td>
<td align="center">191</td>
<td align="center">241</td>
<td align="center">142</td>
<td align="center">109</td>
</tr>
<tr>
<td align="center">Age</td>
<td align="center">68.1</td>
<td align="center">69.9</td>
<td align="center">70.8</td>
<td align="center">73.7</td>
</tr>
<tr>
<td align="center">Sex, male %</td>
<td align="center">35.6</td>
<td align="center">44.4</td>
<td align="center">40.8</td>
<td align="center">56.9</td>
</tr>
<tr>
<td align="center">Education</td>
<td align="center">9.1</td>
<td align="center">10</td>
<td align="center">16.1</td>
<td align="center">16</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>PET scans of the possible population were acquired using a Biograph 40 mCT Flow PET/CT Scanner (Siemens Healthcare, Knoxville, TN, USA) and reconstructed via UltraHD-PET (TrueX-TOF) to obtain PET images, and the obtained images were processed with a 3mm FWHM Gaussian filter. All patients underwent a 20 min positron emission scan at 90 min after intravenous injection of 300mBq of [<sup>18</sup>F]Florbetaben (NeuraCeq, Piramal, Mumbai, India), and the helical CT scans were acquired with a 0.5 s rotation time at 100 kVp and 228 mAs. The images were finally stored in the DICOM format.</p>
<p>Finally, [<sup>18</sup>F]Florbetaben PET images collected from the Alzheimer’s Neuroimaging Initiative (ADNI) database (<ext-link ext-link-type="uri" xlink:href="https://www.loni.ucla.edu/ADNI" xlink:type="simple">www.loni.ucla.edu/ADNI</ext-link>) were used as an external dataset in this study. The database includes scans of subjects with normal control, mild cognitive impairment (MCI), and AD. These scans were preprocessed as an ADNI internal protocol and co-registration, averaging, size changing, standardization, and smoothing processes were performed. However, since ADNI does not determine whether the [<sup>18</sup>F]Florbetaben scans are A<italic>β</italic> negative or positive, classification was performed by the nuclear medicine specialists at DAUH.</p>
<p>Unlike the DAUH dataset, images from the external dataset were not processed with 3 mm FWHM Gaussian filters. To achieve the same conditions, a 3 mm FWHM Gaussian filter was used to process the statistical parametric mapping (SPM) after the acquisition. An example of Gaussian filter processing is shown in <xref ref-type="fig" rid="pone.0258214.g001">Fig 1</xref>.</p>
<fig id="pone.0258214.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Smoothing of the external data.</title>
<p>After the smoothing process, an image in which noise is reduced can be obtained.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g001" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec004">
<title>2.2 Image preprocessing in common</title>
<p>We performed spatial normalization and count normalization to classify A<italic>β</italic> deposition using brain PET. We used the SPM library [<xref ref-type="bibr" rid="pone.0258214.ref015">15</xref>] based on MATLAB. All dataset groups applied the same preprocessing procedure using the same protocol, even if there were differences in the source and collection times.</p>
<p>Spatial normalization is the registration of the original image to a specific PET template. Subjects with various brain shapes can be compared through image registration by mapping the subject’s PET image to a reference brain template [<xref ref-type="bibr" rid="pone.0258214.ref016">16</xref>].</p>
<p>Meanwhile, we made a reference brain PET template in-house. Co-registration was performed with a PET image and a paired CT image obtained from a subject. The template images are average images of 20 normal brains, 20 Alzheimer’s dementia brains, and 40 left and right inversion images, for a total of 80 images. After image registration, the tissue is stretched or compressed to fit the template brain. We can average the PETs of multiple individuals to reconstruct them into a reference brain space and provide atlas anatomical addresses mapped to the same reference brain space at the data locations in the image. We also performed a cropping process that cuts the empty space around the brain, reducing its size from 400 × 400 × 110 to 95 × 79 × 68.</p>
<p>Count normalization is intended for numerical comparisons between images because the image intensity level varies due to differences in the number of radioactive isotopes administered, individual characteristics, or individual body conditions. This normalization was performed assuming that the absorption of radioactive tracers in a brain region is constant for each person. Count normalization normalizes the entire observation area to the value of the area representing non-specific, lesion-independent absorption, allowing absolute and relative comparisons in specific absorption areas of the patient-patient image [<xref ref-type="bibr" rid="pone.0258214.ref017">17</xref>].</p>
<p>The [<sup>18</sup>F]Florbetaben radiotracer exhibits non-specific uptake in the cerebellar region and specific uptake in the gray matter region of the cerebrum; thus, count normalization was performed by using the cerebellar region of the PET template applied in spatial normalization to each patient image.</p>
<p>In addition, the skull, a non-brain tissue, is included in the image because it is spatially normalized with a CT-driven PET template. The presence of these non-brain tissues is considered an obstacle in brain image analysis. Therefore, in brain imaging analysis studies, a preprocessing commonly referred to as skull stripping is required [<xref ref-type="bibr" rid="pone.0258214.ref018">18</xref>].</p>
<p>In the [<sup>18</sup>F]Florbetaben amyloid brain PET classification model, spatial normalization, count normalization, and skull stripping are commonly performed for all datasets, and an example of a brain PET scan image that has been preprocessed is shown in <xref ref-type="fig" rid="pone.0258214.g002">Fig 2</xref>.</p>
<fig id="pone.0258214.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Commonly applied preprocessing.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g002" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec005">
<title>2.3 Model architecture</title>
<p>In this study, we apply CNNs of three well-known architectures to the amyloid classification problem in [<sup>18</sup>F]Florbetaben brain PET. The architectures considered are Inception [<xref ref-type="bibr" rid="pone.0258214.ref019">19</xref>, <xref ref-type="bibr" rid="pone.0258214.ref020">20</xref>], ResNet [<xref ref-type="bibr" rid="pone.0258214.ref021">21</xref>], and VGG19 [<xref ref-type="bibr" rid="pone.0258214.ref010">10</xref>]. The reasons for choosing these models were to achieve the best performance in various tasks, use a small kernel (3 × 3) [<xref ref-type="bibr" rid="pone.0258214.ref010">10</xref>] instead of a large kernel, utilize a deep but sparse network structure [<xref ref-type="bibr" rid="pone.0258214.ref019">19</xref>], and provide residual connectivity [<xref ref-type="bibr" rid="pone.0258214.ref021">21</xref>]. We implemented the model ourselves by adopting parts of the primary characteristics of these structures and applying 3D convolution filter. Each representative structure is shown in <xref ref-type="fig" rid="pone.0258214.g003">Fig 3</xref>.</p>
<fig id="pone.0258214.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Primary structure of the models.</title>
<p>(a) and (b) are the most characteristic parts of the structure, and (c) is the overall structure of the model. The ‘×2’ written on the side means that the process is repeated as many times as the number.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g003" xlink:type="simple"/>
</fig>
<p>To briefly summarize the meaning of each layer:</p>
<list list-type="bullet">
<list-item>
<p>Conv3D: 3D convolution kernel layer.</p>
</list-item>
<list-item>
<p>BatchNormalization: To avoid gradient vanishing problems due to structural complexity and speed up the training [<xref ref-type="bibr" rid="pone.0258214.ref022">22</xref>].</p>
</list-item>
<list-item>
<p>Activation: When the data that has passed through the layer is transmitted to the next layer, it plays a role in determining whether to transmit the input data according to a specific criterion, and all model structures in this study apply the Rectifier Linear Unit (ReLU) [<xref ref-type="bibr" rid="pone.0258214.ref023">23</xref>] activation function.</p>
</list-item>
<list-item>
<p>Concatenate: To connect data horizontally.</p>
</list-item>
<list-item>
<p>Pooling: Also known as sub-sampling, the image is reduced by selecting a large value or taking an average in the corresponding receptive field.</p>
</list-item>
<list-item>
<p>Dropout: Only certain weights are kept at a certain probability and the remaining connected units are diluted. This is known to prevent network overfitting [<xref ref-type="bibr" rid="pone.0258214.ref024">24</xref>].</p>
</list-item>
</list>
<p>Recently, 3D CNN research has been actively conducted to extract features of 3D medical images for classification [<xref ref-type="bibr" rid="pone.0258214.ref025">25</xref>]. Moreover, because brain images are volume data, 3D CNNs can be configured for image classification to extract 3D spatial features from 3D PET images. Accordingly, Inception, ResNet, and VGG models are constructed in the form of a 3D CNN and are named Inception3D, ResNet3D, and VGG3D in our experiment.</p>
</sec>
<sec id="sec006">
<title>2.4 Model selection and evaluation</title>
<p>Eighty percent of the DAUH dataset, as shown in <xref ref-type="fig" rid="pone.0258214.g004">Fig 4</xref>, was used for model training and the rest is used for model evaluation. The samples were splitted with Stratified ShuffleSplit cross-validator (<ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.StratifiedShuffleSplit.html" xlink:type="simple">https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.StratifiedShuffleSplit.html</ext-link>), which was randomly extracted from each group labeled amyloid positive and negative. Along with the training set, there was also a validation set used to ensure that the model is trained well. This is explained in more detail in <xref ref-type="fig" rid="pone.0258214.g005">Fig 5</xref>.</p>
<fig id="pone.0258214.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g004</object-id>
<label>Fig 4</label>
<caption>
<title>DAUH and external datasets for model training and validation.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g004" xlink:type="simple"/>
</fig>
<fig id="pone.0258214.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Overall workflow.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g005" xlink:type="simple"/>
</fig>
<p>The model training was conducted by four-fold cross-validation with 192 amyloid positive subjects and 153 amyloid negative subjects from the DAUH dataset. If the dataset is small, the reliability of the performance evaluation is reduced. If the performance varies depending on how the validation set is held, the effect of the match will bias the model evaluation performance. To solve this, cross-validation ensures that all data are used as a validation set at least once.</p>
<p>As shown in <xref ref-type="fig" rid="pone.0258214.g006">Fig 6</xref>, the entire dataset can be divided into four subsets; the first subset is used as the validation set in the first iteration, and the remaining subsets are used as the training set. In the second iteration, the second subset is used as the validation set, and the remaining subsets are used as the training set. By repeating the number of subsets in this manner, we could select the lowest loss model out of the four performances.</p>
<fig id="pone.0258214.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Four-fold cross-validation for each iteration.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g006" xlink:type="simple"/>
</fig>
<p>All models of each structure were selected through four-fold cross-validation [<xref ref-type="bibr" rid="pone.0258214.ref026">26</xref>] and evaluated with the model evaluation set of the DAUH dataset specified in <xref ref-type="fig" rid="pone.0258214.g004">Fig 4</xref>.</p>
<p>In the external dataset, some samples were randomly extracted using the same sample extraction method. If the accuracy was significantly different between the model evaluation and the external validation, it is possible that a part of the external dataset could be included in the training set to acquire generalization performance. In that case, only a portion of the dataset was composed of the external validation set.</p>
</sec>
</sec>
<sec id="sec007" sec-type="results">
<title>3 Results</title>
<p>We investigated information about the model and the time required for each experiment. Specifications about the models can be viewed in <xref ref-type="table" rid="pone.0258214.t002">Table 2</xref>. Experiment time consists of training, image loading, and prediction using the validation set. The required time for each network is Inception3D 1.46hrs, ResNet3D 1.9hours, and VGG3D 1.90 hours. Inference time took about 0.24 seconds per subject, and all experiments were performed on a workstation with four NVIDIA Titan Xp GPUs.</p>
<table-wrap id="pone.0258214.t002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t002</object-id>
<label>Table 2</label>
<caption>
<title>Specifications about the models.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t002g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t002" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="center">Inception3D</th>
<th align="center">ResNet3D</th>
<th align="center">VGG3D</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">Total params</td>
<td align="right">6,098,530</td>
<td align="right">17,620,196</td>
<td align="center">17,236,386</td>
</tr>
<tr>
<td align="center">Trainable params</td>
<td align="right">6,093,538</td>
<td align="right">17,612,642</td>
<td align="center">17,236,002</td>
</tr>
<tr>
<td align="center">Non-trainable params</td>
<td align="right">4,992</td>
<td align="right">7,554</td>
<td align="center">384</td>
</tr>
<tr>
<td align="center">Size on disk</td>
<td align="right">70</td>
<td align="right">202</td>
<td align="center">195</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<sec id="sec008">
<title>3.1 Data distribution</title>
<p>To confirm the data distribution of the preprocessed DAUH and external datasets before CNN-based analysis, as shown in <xref ref-type="fig" rid="pone.0258214.g007">Fig 7</xref>, t-SNE (Stochastic Neighbor Embedding) [<xref ref-type="bibr" rid="pone.0258214.ref027">27</xref>] visualization, which is widely used for visualization after a data dimension reduction, was performed. Although the sources of the datasets are different, the same groups have a similar distribution. In other words, data similarity was observed between the same groups.</p>
<fig id="pone.0258214.g007" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g007</object-id>
<label>Fig 7</label>
<caption>
<title>Dataset distribution using t-SNE visualization.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g007" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec009">
<title>3.2 Model evaluation</title>
<p>The model evaluation results of the Inception3D, ResNet3D, and VGG3D models after training the models with the DAUH training dataset are summarized in <xref ref-type="table" rid="pone.0258214.t003">Table 3</xref>. To evaluate the performance of each model, three metrics were considered: sensitivity, specificity, and accuracy.</p>
<table-wrap id="pone.0258214.t003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t003</object-id>
<label>Table 3</label>
<caption>
<title>Classification evaluation metrics.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t003g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t003" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" rowspan="2"/>
<th align="center" colspan="2">Inception3D</th>
<th align="center" colspan="2">ResNet3D</th>
<th align="center" colspan="2">VGG3D</th>
</tr>
<tr>
<th align="center">Model Evaluation</th>
<th align="center">External Validation</th>
<th align="center">Model Evaluation</th>
<th align="center">External Validation</th>
<th align="center">Model Evaluation</th>
<th align="center">External Validation</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">AUC</td>
<td align="center">0.996</td>
<td align="center">0.883</td>
<td align="center">0.968</td>
<td align="center">0.901</td>
<td align="center">0.98</td>
<td align="center">0.945</td>
</tr>
<tr>
<td align="center">Sensitivity</td>
<td align="center">0.918</td>
<td align="center">0.845</td>
<td align="center">0.918</td>
<td align="center">0.944</td>
<td align="center">0.959</td>
<td align="center">0.831</td>
</tr>
<tr>
<td align="center">Specificity</td>
<td align="center">1</td>
<td align="center">0.707</td>
<td align="center">0.921</td>
<td align="center">0.469</td>
<td align="center">1</td>
<td align="center">0.945</td>
</tr>
<tr>
<td align="center">PPV</td>
<td align="center">1</td>
<td align="center">0.69</td>
<td align="center">0.938</td>
<td align="center">0.458</td>
<td align="center">1</td>
<td align="center">0.831</td>
</tr>
<tr>
<td align="center">NPV</td>
<td align="center">0.905</td>
<td align="center">0.855</td>
<td align="center">0.897</td>
<td align="center">0.918</td>
<td align="center">0.95</td>
<td align="center">0.87</td>
</tr>
<tr>
<td align="center">Accuracy</td>
<td align="center">0.954</td>
<td align="center">0.767</td>
<td align="center">0.92</td>
<td align="center">0.671</td>
<td align="center">0.977</td>
<td align="center">0.87</td>
</tr>
<tr>
<td align="center">Standard Deviation</td>
<td align="center">0.487</td>
<td align="center">0.452</td>
<td align="center">0.482</td>
<td align="center">0.351</td>
<td align="center">0.95</td>
<td align="center">0.853</td>
</tr>
<tr>
<td align="center">95% Confidence Interval</td>
<td align="center">0.950 to 1.000</td>
<td align="center">0.823 to 0.928</td>
<td align="center">0.907 to 0.994</td>
<td align="center">0.845 to 0.942</td>
<td align="center">0.923 to 0.998</td>
<td align="center">0.898 to 0.974</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>Sensitivity is the proportion of subjects who are inferred to be positive among all A<italic>β</italic>-positive subjects and is defined as follows:
<disp-formula id="pone.0258214.e001"><alternatives><graphic id="pone.0258214.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0258214.e001" xlink:type="simple"/><mml:math display="block" id="M1"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>S</mml:mi> <mml:mi>e</mml:mi> <mml:mi>n</mml:mi> <mml:mi>s</mml:mi> <mml:mi>i</mml:mi> <mml:mi>t</mml:mi> <mml:mi>i</mml:mi> <mml:mi>v</mml:mi> <mml:mi>i</mml:mi> <mml:mi>t</mml:mi> <mml:mi>y</mml:mi> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi></mml:mrow> <mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi> <mml:mo>+</mml:mo> <mml:mi>F</mml:mi> <mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where TP represents the number of true positives and FN represents the number of false negatives.</p>
<p>Specificity is the proportion of subjects who are inferred to be negative among all A<italic>β</italic>-negative subjects and is defined as follows:
<disp-formula id="pone.0258214.e002"><alternatives><graphic id="pone.0258214.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0258214.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>S</mml:mi> <mml:mi>p</mml:mi> <mml:mi>e</mml:mi> <mml:mi>c</mml:mi> <mml:mi>i</mml:mi> <mml:mi>f</mml:mi> <mml:mi>i</mml:mi> <mml:mi>c</mml:mi> <mml:mi>i</mml:mi> <mml:mi>t</mml:mi> <mml:mi>y</mml:mi> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mi>T</mml:mi> <mml:mi>N</mml:mi></mml:mrow> <mml:mrow><mml:mi>T</mml:mi> <mml:mi>N</mml:mi> <mml:mo>+</mml:mo> <mml:mi>F</mml:mi> <mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where TN represents the number of true negatives and FP indicates the number of false positives.</p>
<p>PPV(Positive Predictive Value) is the probability that those that come out A<italic>β</italic> positive actually have A<italic>β</italic> positive according to the ground truth. NPV(Negative Predictive Value) is the probability that those that come out A<italic>β</italic> negative actually have A<italic>β</italic> negative according to the ground truth.
<disp-formula id="pone.0258214.e003"><alternatives><graphic id="pone.0258214.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0258214.e003" xlink:type="simple"/><mml:math display="block" id="M3"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>P</mml:mi> <mml:mi>P</mml:mi> <mml:mi>V</mml:mi> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi></mml:mrow> <mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi> <mml:mo>+</mml:mo> <mml:mi>F</mml:mi> <mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula> <disp-formula id="pone.0258214.e004"><alternatives><graphic id="pone.0258214.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0258214.e004" xlink:type="simple"/><mml:math display="block" id="M4"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>N</mml:mi> <mml:mi>P</mml:mi> <mml:mi>V</mml:mi> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mi>T</mml:mi> <mml:mi>N</mml:mi></mml:mrow> <mml:mrow><mml:mi>F</mml:mi> <mml:mi>N</mml:mi> <mml:mo>+</mml:mo> <mml:mi>T</mml:mi> <mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Accuracy is the degree of closeness between the predicted value and the actual value of the subjects. It is calculated as the number of true positives and negatives among all accurate and evaluated subjects as follows:
<disp-formula id="pone.0258214.e005"><alternatives><graphic id="pone.0258214.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0258214.e005" xlink:type="simple"/><mml:math display="block" id="M5"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>A</mml:mi> <mml:mi>c</mml:mi> <mml:mi>c</mml:mi> <mml:mi>u</mml:mi> <mml:mi>r</mml:mi> <mml:mi>a</mml:mi> <mml:mi>c</mml:mi> <mml:mi>y</mml:mi> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi> <mml:mo>+</mml:mo> <mml:mi>T</mml:mi> <mml:mi>N</mml:mi></mml:mrow> <mml:mrow><mml:mi>T</mml:mi> <mml:mi>P</mml:mi> <mml:mo>+</mml:mo> <mml:mi>F</mml:mi> <mml:mi>N</mml:mi> <mml:mo>+</mml:mo> <mml:mi>T</mml:mi> <mml:mi>N</mml:mi> <mml:mo>+</mml:mo> <mml:mi>F</mml:mi> <mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>We plotted the receiver operating characteristic (ROC) curve of our method for A<italic>β</italic> positivity, as shown in <xref ref-type="fig" rid="pone.0258214.g008">Fig 8</xref>, and calculated the area under the curve (AUC). The AUC value was close to 1 for all three models.</p>
<fig id="pone.0258214.g008" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g008</object-id>
<label>Fig 8</label>
<caption>
<title>ROC curves for each model evaluation.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g008" xlink:type="simple"/>
</fig>
<p>
<xref ref-type="table" rid="pone.0258214.t004">Table 4</xref> summarizes the pairwise comparison results of ROC curves obtained from the Inception3D, ResNet3D, and VGG3D inferences that performed model evaluation. At the 95% significance level, since both p-values are greater than 0.05, the corresponding two comparison areas are not significantly different.</p>
<table-wrap id="pone.0258214.t004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t004</object-id>
<label>Table 4</label>
<caption>
<title>Comparison of ROC curves.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t004g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t004" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<tbody>
<tr>
<td align="left" colspan="5">Pairwise comparison of ROC curves for each model evaluation</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Difference between areas</td>
<td align="left">SE</td>
<td align="left">95% CI</td>
<td align="left">P-value</td>
</tr>
<tr>
<td align="left">Inception3D vs. ResNet3D</td>
<td align="left">0.0274</td>
<td align="left">0.0154</td>
<td align="left">-0.00282 to 0.0576</td>
<td align="left">0.0756</td>
</tr>
<tr>
<td align="left">Inception3D vs. VGG3D</td>
<td align="left">0.0161</td>
<td align="left">0.0208</td>
<td align="left">-0.0246 to 0.0569</td>
<td align="left">0.4384</td>
</tr>
<tr>
<td align="left">ResNet3D vs. VGG3D</td>
<td align="left">0.0113</td>
<td align="left">0.0203</td>
<td align="left">-0.0285 to 0.0510</td>
<td align="left">0.5780</td>
</tr>
<tr>
<td align="left" colspan="5">Comparison of independent ROC curves with the model evaluations and the external validations</td>
</tr>
<tr>
<td align="left">Inception3D</td>
<td align="left">0.113</td>
<td align="left">0.0266</td>
<td align="left">0.0610 to 0.165</td>
<td align="left">&lt;0.05</td>
</tr>
<tr>
<td align="left">ResNet3D</td>
<td align="left">0.0672</td>
<td align="left">0.0306</td>
<td align="left">0.00733 to 0.127</td>
<td align="left">&lt;0.05</td>
</tr>
<tr>
<td align="left">VGG3D</td>
<td align="left">0.0349</td>
<td align="left">0.0269</td>
<td align="left">-0.0179 to 0.0876</td>
<td align="left">0.1950</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t004fn001">
<p>Note. SE = standard error, CI = confidence interval</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec010">
<title>3.3 External validation</title>
<p>With respect to accuracy and AUC, VGG3D showed the best classification performance. As summarized in <xref ref-type="table" rid="pone.0258214.t003">Table 3</xref>, the AUC of the external validations was lower than that of the model evaluation, and a comparison of the p-values summarized in <xref ref-type="table" rid="pone.0258214.t004">Table 4</xref> indicates that Inception3D and ResNet3D were below the significance level; thus, there were significant differences in the performance evaluation. However, there was no significant difference between the model evaluation and the external validation for the VGG model, as shown by the significance level, p = 0.1950. The ROC curves of the comparison are plotted in <xref ref-type="fig" rid="pone.0258214.g009">Fig 9</xref>.</p>
<fig id="pone.0258214.g009" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g009</object-id>
<label>Fig 9</label>
<caption>
<title>ROC curve comparison for each model.</title>
<p>In the legend of each plot, ‘<italic>ext</italic>_<italic>val</italic>’ means the external validation, and ‘<italic>model</italic>_<italic>eval</italic>’ means the model evaluation.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g009" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec011">
<title>3.4 Retraining model</title>
<p>This is a method of redefining the model to create a generalized model by additionally retraining a part of the external dataset to the model trained with the DAUH training set. In this part, excluding the external validation set shown in <xref ref-type="fig" rid="pone.0258214.g004">Fig 4</xref>, the 38 A<italic>β</italic> positives and 50 A<italic>β</italic> negatives were configured as a retraining set for fine tuning. the pre-trained model was imported as it is, and all layers were retrained.</p>
<p>As summarized in <xref ref-type="table" rid="pone.0258214.t005">Table 5</xref>, when the external validation was performed, the classification performance was improved compared to before retraining. The evaluation performance of the models trained with DAUH was compared with that of models additionally retrained with the residue of the external datasets by independent ROC. Both evaluation performances were within the 95% confidence level (Inception3D: 0.5124, ResNet3D: 0.3247), as shown in <xref ref-type="table" rid="pone.0258214.t006">Table 6</xref>. No significant difference was observed between the two evaluations for each model, and the ROC curves are shown in <xref ref-type="fig" rid="pone.0258214.g010">Fig 10</xref>.</p>
<table-wrap id="pone.0258214.t005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t005</object-id>
<label>Table 5</label>
<caption>
<title>External validation after model retraining.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t005g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t005" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="center">Inception3D</th>
<th align="center">ResNet3D</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">AUC</td>
<td align="char" char=".">0.95</td>
<td align="char" char=".">0.943</td>
</tr>
<tr>
<td align="center">Sensitivity</td>
<td align="char" char=".">0.845</td>
<td align="char" char=".">0.915</td>
</tr>
<tr>
<td align="center">Specificity</td>
<td align="char" char=".">0.967</td>
<td align="char" char=".">0.783</td>
</tr>
<tr>
<td align="center">Accuracy</td>
<td align="char" char=".">0.92</td>
<td align="char" char=".">0.84</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<table-wrap id="pone.0258214.t006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.t006</object-id>
<label>Table 6</label>
<caption>
<title>Comparison of independent ROC curves with the model evaluations and the external validations after retraining.</title>
</caption>
<alternatives>
<graphic id="pone.0258214.t006g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.t006" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="center">Difference between areas</th>
<th align="center">SE</th>
<th align="center">95% CI</th>
<th align="center">P-value</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">Inception3D</td>
<td align="char" char=".">0.0185</td>
<td align="char" char=".">0.0283</td>
<td align="center">-0.0369 to 0.0740</td>
<td align="char" char=".">0.5124</td>
</tr>
<tr>
<td align="left">ResNet3D</td>
<td align="char" char=".">0.0251</td>
<td align="char" char=".">0.0255</td>
<td align="center">-0.0249 to 0.0751</td>
<td align="char" char=".">0.3247</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<fig id="pone.0258214.g010" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g010</object-id>
<label>Fig 10</label>
<caption>
<title>ROC curve comparison between the external validation after retraining and the model evaluation.</title>
<p>The ‘<italic>fine</italic>_<italic>tuning</italic>’ curve indicates the external validation after retraining and ‘<italic>model</italic>_<italic>eval</italic>’ indicates the model evaluation.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g010" xlink:type="simple"/>
</fig>
</sec>
</sec>
<sec id="sec012" sec-type="conclusions">
<title>4 Discussion</title>
<p>Currently, PET scans are used to diagnose AD by determining the level of amyloid deposition, which is assessed for severity through visual assessment by experts. We also assessed it and obtained Fleiss’ Kappa coefficient to determine it statistically, and the interreader agreement was derived as <italic>κ</italic> = 0.8950. However, this method cannot provide consistent results, as different specialists may interpret images differently. In addition, a doctor’s prior experience can have a significant impact on the reliability of the diagnostic results. Therefore, CNN-based medical image analysis, a deep learning procedure, can produce consistent results and improve confidence in the diagnosis.</p>
<p>Similar to other CNN-based neuroimaging classification studies, our model evaluation of the amyloid positivity classification problem in [<sup>18</sup>F]Florbetaben brain PET yielded an average of approximately 95% accuracy results. In addition, the CNN trained with the single institution dataset demonstrated satisfactory performance when tested with [<sup>18</sup>F]Florbetaben brain PET images obtained from the subjects in the ADNI database. These results support that this CNN model can help diagnose AD by developing a computer-aided detection tool to determine amyloid positivity since these CNN models can recognize the amyloid deposition features of the brain well.</p>
<p>In the external validation, the classification performance of the VGG 3D model was the best with an AUC of 0.945 and an accuracy of 85.3%, but the optimal model may be different if the experimental conditions are different or other model structures are performed. There was also a difference in the classification performance between the model evaluation and the external validation with the Inception3D and ResNet3D models (significance level &lt; 0.05). Thus, a method to overcome these issues is yet to be developed. This improves optimization by fine tuning [<xref ref-type="bibr" rid="pone.0258214.ref028">28</xref>, <xref ref-type="bibr" rid="pone.0258214.ref029">29</xref>] weights using the learning part or all the layers in Section 3.4.</p>
<sec id="sec013">
<title>4.1 Open platform</title>
<p>Our CNN-based [<sup>18</sup>F]Florbetaben amyloid brain PET classification studies have a limitation in that only the DAUH dataset and ADNI have been utilized. Therefore, a medical imaging artificial intelligence (AI) research platform that enables doctors with medical knowledge and medical data to perform medical AI research without programming is needed. DEEP:PHI is one such open platform (<ext-link ext-link-type="uri" xlink:href="https://www.deepphi.ai" xlink:type="simple">https://www.deepphi.ai</ext-link>). It is a research platform developed by DEEPNOID, a Korean medical AI startup company that is currently being serviced in the form of a closed beta, and a number of doctors are using this platform to conduct artificial intelligence research.</p>
<p>As shown in <xref ref-type="fig" rid="pone.0258214.g011">Fig 11</xref>, DEEP:PHI comprises a GUI, and it is possible to perform image preprocessing, neural network model generation, and neural network training results verification within the DEEP:PHI platform from the workflow window. In addition, the server provides a high-end research environment without a GPU and hard disk drive in the local environment. As it operates on the web, the platform allows doctors and developers of various organizations to collect data and perform collaborative research directly on the web. The models from our research can also be uploaded to the DEEP:PHI platform and used for various AI research. If necessary, it is possible to modify and create modules specialized for specific research through the code editor.</p>
<fig id="pone.0258214.g011" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0258214.g011</object-id>
<label>Fig 11</label>
<caption>
<title>GUI of DEEP:PHI.</title>
<p>The image preprocessing, performance, etc. can be seen in the window.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.g011" xlink:type="simple"/>
</fig>
</sec>
</sec>
<sec id="sec014" sec-type="conclusions">
<title>5 Conclusion</title>
<p>The A<italic>β</italic> classification model was evaluated and external validation was performed with the ADNI dataset. The detailed information on model evaluation and external validation results can be seen in <xref ref-type="supplementary-material" rid="pone.0258214.s001">S1 File</xref>. The model evaluation results show that the classification performance produces the high accuracy. On the other hand, data from other sources may have differences in quality when compared to the evaluation dataset, which could lead to the poor classification, and preprocessing to minimize these differences is important in external validation. Even though the data have been refined, when the deep learning classification model does not classify tasks well in the external validation step, the model performance can be improved by including other structures or retraining the model. In addition, it is possible to implement an optimal model through various research collaborations using an open platform for medical image AI research.</p>
</sec>
<sec id="sec015" sec-type="supplementary-material">
<title>Supporting information</title>
<supplementary-material id="pone.0258214.s001" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0258214.s001" xlink:type="simple">
<label>S1 File</label>
<caption>
<title>A<italic>β</italic> positive probability using CNN.</title>
<p>This is the probability of predicting the label for each CNN model(EXCEL). The label is coded as A<italic>β</italic> positive 1 and A<italic>β</italic> negative 0, and if the probability exceeds 0.5, it is predicted as A<italic>β</italic> positive, and if it is less than 0.5, it is predicted as A<italic>β</italic> negative. One tab is configured for each validation type, and the meaning of the tab name is as follows:
<list list-type="bullet">
<list-item><p>model_eval: model evaluation.</p></list-item>
<list-item><p>external_val: external validation.</p></list-item>
<list-item><p>ext_additional: external validation after the fine tunning.</p></list-item>
</list></p>
<p>(XLSX)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>This research was supported by the National Research Foundation (NRF) of Korea funded by the Ministry of Science, ICT &amp; Future Planning (NRF2018 R1A2B2008178).</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0258214.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kang</surname> <given-names>DW</given-names></name>, <name name-style="western"><surname>Lim</surname> <given-names>HK</given-names></name>. <article-title>Current Knowledge and Clinical Application of Brain Imaging in Alzheimer’s Disease</article-title>. <source>Journal of Korean Neuropsychiatric Association</source>. <year>2018</year>;<volume>57</volume>(<issue>1</issue>):<fpage>12</fpage>–<lpage>22</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.4306/jknpa.2018.57.1.12" xlink:type="simple">10.4306/jknpa.2018.57.1.12</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0258214.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Varghese</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Sheelakumari</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>James</surname> <given-names>JS</given-names></name>, <name name-style="western"><surname>Mathuranath</surname> <given-names>PS</given-names></name>. <article-title>A review of neuroimaging biomarkers of Alzheimer’s disease</article-title>. <source>Neurology Asia</source>. <year>2013</year>;<volume>18</volume>(<issue>3</issue>):<fpage>239</fpage>. <object-id pub-id-type="pmid">25431627</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Suk</surname> <given-names>HI</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>SW</given-names></name>, <name name-style="western"><surname>Shen</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Initiative</surname> <given-names>ADN</given-names></name>, <etal>et al</etal>. <article-title>Hierarchical feature representation and multimodal fusion with deep learning for AD/MCI diagnosis</article-title>. <source>NeuroImage</source>. <year>2014</year>;<volume>101</volume>:<fpage>569</fpage>–<lpage>582</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.neuroimage.2014.06.077" xlink:type="simple">10.1016/j.neuroimage.2014.06.077</ext-link></comment> <object-id pub-id-type="pmid">25042445</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Suk</surname> <given-names>HI</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>SW</given-names></name>, <name name-style="western"><surname>Shen</surname> <given-names>D</given-names></name>. <article-title>Latent feature representation with stacked auto-encoder for AD/MCI diagnosis</article-title>. <source>Brain Structure and Function</source>. <year>2015</year>;<volume>220</volume>(<issue>2</issue>):<fpage>841</fpage>–<lpage>859</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s00429-013-0687-3" xlink:type="simple">10.1007/s00429-013-0687-3</ext-link></comment> <object-id pub-id-type="pmid">24363140</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Shi</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Zheng</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Ying</surname> <given-names>S</given-names></name>. <article-title>Multimodal neuroimaging feature learning with multimodal stacked deep polynomial networks for diagnosis of Alzheimer’s disease</article-title>. <source>IEEE journal of biomedical and health informatics</source>. <year>2017</year>;<volume>22</volume>(<issue>1</issue>):<fpage>173</fpage>–<lpage>183</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/JBHI.2017.2655720" xlink:type="simple">10.1109/JBHI.2017.2655720</ext-link></comment> <object-id pub-id-type="pmid">28113353</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref006">
<label>6</label>
<mixed-citation publication-type="other" xlink:type="simple">Comelli A, Stefano A, Bignardi S, Coronnello C, Russo G, Sabini MG, et al. Tissue classification to support local active delineation of brain tumors. In: Annual Conference on Medical Image Understanding and Analysis. Springer; 2019. p. 3–14.</mixed-citation>
</ref>
<ref id="pone.0258214.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stefano</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Comelli</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Bravatà</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Barone</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Daskalovski</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Savoca</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>A preliminary PET radiomics study of brain metastases using a fully automatic segmentation method</article-title>. <source>BMC bioinformatics</source>. <year>2020</year>;<volume>21</volume>(<issue>8</issue>):<fpage>1</fpage>–<lpage>14</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12859-020-03647-7" xlink:type="simple">10.1186/s12859-020-03647-7</ext-link></comment> <object-id pub-id-type="pmid">32938360</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Cho</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>WG</given-names></name>, <name name-style="western"><surname>Kang</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>GS</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>HW</given-names></name>, <name name-style="western"><surname>Jeong</surname> <given-names>JE</given-names></name>, <etal>et al</etal>. <article-title>Classification of 18 F-Florbetaben Amyloid Brain PET Image using PCA-SVM</article-title>. <source>Biomedical Science Letters</source>. <year>2019</year>;<volume>25</volume>(<issue>1</issue>):<fpage>99</fpage>–<lpage>106</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.15616/BSL.2019.25.1.99" xlink:type="simple">10.15616/BSL.2019.25.1.99</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0258214.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kang</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>WG</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>GS</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>HW</given-names></name>, <name name-style="western"><surname>Jeong</surname> <given-names>JE</given-names></name>, <name name-style="western"><surname>Yoon</surname> <given-names>HJ</given-names></name>, <etal>et al</etal>. <article-title>VGG-based BAPL score classification of 18F-florbetaben amyloid brain PET</article-title>. <source>Biomedical Science Letters</source>. <year>2018</year>;<volume>24</volume>(<issue>4</issue>):<fpage>418</fpage>–<lpage>425</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.15616/BSL.2018.24.4.418" xlink:type="simple">10.15616/BSL.2018.24.4.418</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0258214.ref010">
<label>10</label>
<mixed-citation publication-type="other" xlink:type="simple">Simonyan K, Zisserman A. Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:14091556. 2014;.</mixed-citation>
</ref>
<ref id="pone.0258214.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Suzuki</surname> <given-names>K</given-names></name>. <article-title>Overview of deep learning in medical imaging</article-title>. <source>Radiological physics and technology</source>. <year>2017</year>;<volume>10</volume>(<issue>3</issue>):<fpage>257</fpage>–<lpage>273</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s12194-017-0406-5" xlink:type="simple">10.1007/s12194-017-0406-5</ext-link></comment> <object-id pub-id-type="pmid">28689314</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Litjens</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Kooi</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Bejnordi</surname> <given-names>BE</given-names></name>, <name name-style="western"><surname>Setio</surname> <given-names>AAA</given-names></name>, <name name-style="western"><surname>Ciompi</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Ghafoorian</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>A survey on deep learning in medical image analysis</article-title>. <source>Medical image analysis</source>. <year>2017</year>;<volume>42</volume>:<fpage>60</fpage>–<lpage>88</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.media.2017.07.005" xlink:type="simple">10.1016/j.media.2017.07.005</ext-link></comment> <object-id pub-id-type="pmid">28778026</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Liu</surname> <given-names>KL</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>PT</given-names></name>, <name name-style="western"><surname>Tsai</surname> <given-names>YM</given-names></name>, <name name-style="western"><surname>Roth</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>MS</given-names></name>, <etal>et al</etal>. <article-title>Deep learning to distinguish pancreatic cancer tissue from non-cancerous pancreatic tissue: a retrospective study with cross-racial external validation</article-title>. <source>The Lancet Digital Health</source>. <year>2020</year>;<volume>2</volume>(<issue>6</issue>):<fpage>e303</fpage>–<lpage>e313</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S2589-7500(20)30078-9" xlink:type="simple">10.1016/S2589-7500(20)30078-9</ext-link></comment> <object-id pub-id-type="pmid">33328124</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Baldwin</surname> <given-names>DR</given-names></name>, <name name-style="western"><surname>Gustafson</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Pickup</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Arteta</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Novotny</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Declerck</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>External validation of a convolutional neural network artificial intelligence tool to predict malignancy in pulmonary nodules</article-title>. <source>Thorax</source>. <year>2020</year>;<volume>75</volume>(<issue>4</issue>):<fpage>306</fpage>–<lpage>312</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1136/thoraxjnl-2019-214104" xlink:type="simple">10.1136/thoraxjnl-2019-214104</ext-link></comment> <object-id pub-id-type="pmid">32139611</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ashburner</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Friston</surname> <given-names>KJ</given-names></name>. <article-title>Nonlinear spatial normalization using basis functions</article-title>. <source>Human brain mapping</source>. <year>1999</year>;<volume>7</volume>(<issue>4</issue>):<fpage>254</fpage>–<lpage>266</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/(SICI)1097-0193(1999)7:4&lt;254::AID-HBM4&gt;3.0.CO;2-G" xlink:type="simple">10.1002/(SICI)1097-0193(1999)7:4&lt;254::AID-HBM4&gt;3.0.CO;2-G</ext-link></comment> <object-id pub-id-type="pmid">10408769</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref016">
<label>16</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Schmidt</surname> <given-names>ME</given-names></name>, <name name-style="western"><surname>Matthews</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Andrews</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Mosconi</surname> <given-names>L</given-names></name>. <chapter-title>Positron emission tomography in Alzheimer disease: diagnosis and use as biomarker endpoints</chapter-title>. In: <source>Translational Neuroimaging</source>. <publisher-name>Elsevier</publisher-name>; <year>2013</year>. p. <fpage>131</fpage>–<lpage>174</lpage>.</mixed-citation>
</ref>
<ref id="pone.0258214.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Win</surname> <given-names>TP</given-names></name>, <name name-style="western"><surname>Hosokai</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Minagawa</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Muroi</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Miwa</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Maruyama</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Comparison of Count Normalization Methods for Statistical Parametric Mapping Analysis Using a Digital Brain Phantom Obtained from Fluorodeoxyglucose-positron Emission Tomography</article-title>. <source>Asia Oceania Journal of Nuclear Medicine and Biology</source>. <year>2019</year>;<volume>7</volume>(<issue>1</issue>):<fpage>58</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.22038/AOJNMB.2018.11745" xlink:type="simple">10.22038/AOJNMB.2018.11745</ext-link></comment> <object-id pub-id-type="pmid">30705912</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kalavathi</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Prasath</surname> <given-names>VS</given-names></name>. <article-title>Methods on skull stripping of MRI head scan images—a review</article-title>. <source>Journal of digital imaging</source>. <year>2016</year>;<volume>29</volume>(<issue>3</issue>):<fpage>365</fpage>–<lpage>379</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s10278-015-9847-8" xlink:type="simple">10.1007/s10278-015-9847-8</ext-link></comment> <object-id pub-id-type="pmid">26628083</object-id></mixed-citation>
</ref>
<ref id="pone.0258214.ref019">
<label>19</label>
<mixed-citation publication-type="other" xlink:type="simple">Szegedy C, Liu W, Jia Y, Sermanet P, Reed S, Anguelov D, et al. Going deeper with convolutions. In: Proceedings of the IEEE conference on computer vision and pattern recognition; 2015. p. 1–9.</mixed-citation>
</ref>
<ref id="pone.0258214.ref020">
<label>20</label>
<mixed-citation publication-type="other" xlink:type="simple">Szegedy C, Vanhoucke V, Ioffe S, Shlens J, Wojna Z. Rethinking the inception architecture for computer vision. In: Proceedings of the IEEE conference on computer vision and pattern recognition; 2016. p. 2818–2826.</mixed-citation>
</ref>
<ref id="pone.0258214.ref021">
<label>21</label>
<mixed-citation publication-type="other" xlink:type="simple">He K, Zhang X, Ren S, Sun J. Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition; 2016. p. 770–778.</mixed-citation>
</ref>
<ref id="pone.0258214.ref022">
<label>22</label>
<mixed-citation publication-type="other" xlink:type="simple">Ioffe S, Szegedy C. Batch normalization: Accelerating deep network training by reducing internal covariate shift. In: International conference on machine learning. PMLR; 2015. p. 448–456.</mixed-citation>
</ref>
<ref id="pone.0258214.ref023">
<label>23</label>
<mixed-citation publication-type="other" xlink:type="simple">Nair V, Hinton GE. Rectified Linear Units Improve Restricted Boltzmann Machines. In: ICML; 2010. p. 807–814. Available from: <ext-link ext-link-type="uri" xlink:href="https://icml.cc/Conferences/2010/papers/432.pdf" xlink:type="simple">https://icml.cc/Conferences/2010/papers/432.pdf</ext-link>.</mixed-citation>
</ref>
<ref id="pone.0258214.ref024">
<label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Srivastava</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Hinton</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Krizhevsky</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Sutskever</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Salakhutdinov</surname> <given-names>R</given-names></name>. <article-title>Dropout: a simple way to prevent neural networks from overfitting</article-title>. <source>The journal of machine learning research</source>. <year>2014</year>;<volume>15</volume>(<issue>1</issue>):<fpage>1929</fpage>–<lpage>1958</lpage>.</mixed-citation>
</ref>
<ref id="pone.0258214.ref025">
<label>25</label>
<mixed-citation publication-type="other" xlink:type="simple">Hosseini-Asl E, Keynton R, El-Baz A. Alzheimer’s disease diagnostics by adaptation of 3D convolutional network. In: 2016 IEEE International Conference on Image Processing (ICIP). IEEE; 2016. p. 126–130.</mixed-citation>
</ref>
<ref id="pone.0258214.ref026">
<label>26</label>
<mixed-citation publication-type="other" xlink:type="simple">Raschka S. Model evaluation, model selection, and algorithm selection in machine learning. arXiv preprint arXiv:181112808. 2018;.</mixed-citation>
</ref>
<ref id="pone.0258214.ref027">
<label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Van der Maaten</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Hinton</surname> <given-names>G</given-names></name>. <article-title>Visualizing data using t-SNE</article-title>. <source>Journal of machine learning research</source>. <year>2008</year>;<volume>9</volume>(<issue>11</issue>).</mixed-citation>
</ref>
<ref id="pone.0258214.ref028">
<label>28</label>
<mixed-citation publication-type="other" xlink:type="simple">Hussain M, Bird JJ, Faria DR. A study on cnn transfer learning for image classification. In: UK Workshop on computational Intelligence. Springer; 2018. p. 191–202.</mixed-citation>
</ref>
<ref id="pone.0258214.ref029">
<label>29</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pan</surname> <given-names>SJ</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>Q</given-names></name>. <article-title>A survey on transfer learning</article-title>. <source>IEEE Transactions on knowledge and data engineering</source>. <year>2009</year>;<volume>22</volume>(<issue>10</issue>):<fpage>1345</fpage>–<lpage>1359</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/TKDE.2009.191" xlink:type="simple">10.1109/TKDE.2009.191</ext-link></comment></mixed-citation>
</ref>
</ref-list>
</back>
</article>